Trowbridge-Reitz Sample, sample surface normal, cosTheta

Percentage Accurate: 99.4% → 99.8%
Time: 23.0s
Alternatives: 5
Speedup: 2.3×

Specification

?
\[\left(\left(\left(2.328306437 \cdot 10^{-10} \leq u0 \land u0 \leq 1\right) \land \left(2.328306437 \cdot 10^{-10} \leq u1 \land u1 \leq 0.5\right)\right) \land \left(0.0001 \leq alphax \land alphax \leq 1\right)\right) \land \left(0.0001 \leq alphay \land alphay \leq 1\right)\]
\[\begin{array}{l} \\ \begin{array}{l} t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\ t_1 := \sin t\_0\\ t_2 := \cos t\_0\\ \frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0
         (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
        (t_1 (sin t_0))
        (t_2 (cos t_0)))
   (/
    1.0
    (sqrt
     (+
      1.0
      (/
       (*
        (/
         1.0
         (+
          (/ (* t_2 t_2) (* alphax alphax))
          (/ (* t_1 t_1) (* alphay alphay))))
        u0)
       (- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
	float t_1 = sinf(t_0);
	float t_2 = cosf(t_0);
	return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay)
	t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi))))))
	t_1 = sin(t_0)
	t_2 = cos(t_0)
	return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0)))))
end
function tmp = code(u0, u1, alphax, alphay)
	t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi))))));
	t_1 = sin(t_0);
	t_2 = cos(t_0);
	tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}

Sampling outcomes in binary32 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 5 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 99.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\ t_1 := \sin t\_0\\ t_2 := \cos t\_0\\ \frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0
         (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
        (t_1 (sin t_0))
        (t_2 (cos t_0)))
   (/
    1.0
    (sqrt
     (+
      1.0
      (/
       (*
        (/
         1.0
         (+
          (/ (* t_2 t_2) (* alphax alphax))
          (/ (* t_1 t_1) (* alphay alphay))))
        u0)
       (- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
	float t_1 = sinf(t_0);
	float t_2 = cosf(t_0);
	return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay)
	t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi))))))
	t_1 = sin(t_0)
	t_2 = cos(t_0)
	return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0)))))
end
function tmp = code(u0, u1, alphax, alphay)
	t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi))))));
	t_1 = sin(t_0);
	t_2 = cos(t_0);
	tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}

Alternative 1: 99.8% accurate, 2.3× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}\\ {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, t\_0, alphax\right)} + \frac{1 + \frac{1}{-1 - t\_0}}{alphay \cdot alphay}\right)}\right)}^{-0.5} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0 (pow (* (/ alphay alphax) (tan (* (fma 2.0 u1 0.5) PI))) 2.0)))
   (pow
    (+
     1.0
     (/
      u0
      (*
       (- 1.0 u0)
       (+
        (/ 1.0 (* alphax (fma alphax t_0 alphax)))
        (/ (+ 1.0 (/ 1.0 (- -1.0 t_0))) (* alphay alphay))))))
    -0.5)))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = powf(((alphay / alphax) * tanf((fmaf(2.0f, u1, 0.5f) * ((float) M_PI)))), 2.0f);
	return powf((1.0f + (u0 / ((1.0f - u0) * ((1.0f / (alphax * fmaf(alphax, t_0, alphax))) + ((1.0f + (1.0f / (-1.0f - t_0))) / (alphay * alphay)))))), -0.5f);
}
function code(u0, u1, alphax, alphay)
	t_0 = Float32(Float32(alphay / alphax) * tan(Float32(fma(Float32(2.0), u1, Float32(0.5)) * Float32(pi)))) ^ Float32(2.0)
	return Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(1.0) / Float32(alphax * fma(alphax, t_0, alphax))) + Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - t_0))) / Float32(alphay * alphay)))))) ^ Float32(-0.5)
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}\\
{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, t\_0, alphax\right)} + \frac{1 + \frac{1}{-1 - t\_0}}{alphay \cdot alphay}\right)}\right)}^{-0.5}
\end{array}
\end{array}
Derivation
  1. Initial program 99.4%

    \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
  2. Add Preprocessing
  3. Applied rewrites99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{\frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)}^{2}}}{alphax \cdot alphax} + \frac{1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)\right)}{\left(alphay \cdot alphay\right) \cdot 2}\right)}}}} \]
  4. Applied rewrites100.0%

    \[\leadsto \color{blue}{{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)} + \frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}}}{alphay \cdot alphay}\right)}\right)}^{-0.5}} \]
  5. Applied rewrites100.0%

    \[\leadsto {\color{blue}{\left(\frac{u0}{\left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1 + \frac{-1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}}}{alphay \cdot alphay}\right) \cdot \left(1 - u0\right)} + 1\right)}}^{-0.5} \]
  6. Final simplification100.0%

    \[\leadsto {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1 + \frac{1}{-1 - {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}}}{alphay \cdot alphay}\right)}\right)}^{-0.5} \]
  7. Add Preprocessing

Alternative 2: 99.3% accurate, 2.6× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}\\ \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, t\_0, alphax\right)} + \frac{1 + \frac{1}{-1 - t\_0}}{alphay \cdot alphay}\right)}}} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0 (pow (* (/ alphay alphax) (tan (* (fma 2.0 u1 0.5) PI))) 2.0)))
   (/
    1.0
    (sqrt
     (+
      1.0
      (/
       u0
       (*
        (- 1.0 u0)
        (+
         (/ 1.0 (* alphax (fma alphax t_0 alphax)))
         (/ (+ 1.0 (/ 1.0 (- -1.0 t_0))) (* alphay alphay))))))))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = powf(((alphay / alphax) * tanf((fmaf(2.0f, u1, 0.5f) * ((float) M_PI)))), 2.0f);
	return 1.0f / sqrtf((1.0f + (u0 / ((1.0f - u0) * ((1.0f / (alphax * fmaf(alphax, t_0, alphax))) + ((1.0f + (1.0f / (-1.0f - t_0))) / (alphay * alphay)))))));
}
function code(u0, u1, alphax, alphay)
	t_0 = Float32(Float32(alphay / alphax) * tan(Float32(fma(Float32(2.0), u1, Float32(0.5)) * Float32(pi)))) ^ Float32(2.0)
	return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(1.0) / Float32(alphax * fma(alphax, t_0, alphax))) + Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - t_0))) / Float32(alphay * alphay))))))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}\\
\frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, t\_0, alphax\right)} + \frac{1 + \frac{1}{-1 - t\_0}}{alphay \cdot alphay}\right)}}}
\end{array}
\end{array}
Derivation
  1. Initial program 99.4%

    \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
  2. Add Preprocessing
  3. Applied rewrites99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{\frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)}^{2}}}{alphax \cdot alphax} + \frac{1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)\right)}{\left(alphay \cdot alphay\right) \cdot 2}\right)}}}} \]
  4. Applied rewrites99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \color{blue}{\left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)}\right)}}}} \]
  5. Step-by-step derivation
    1. lift-PI.f32N/A

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\color{blue}{\mathsf{PI}\left(\right)} \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)}\right)}}} \]
    2. lift-*.f32N/A

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \color{blue}{\left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)}\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)}\right)}}} \]
    3. *-commutativeN/A

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \color{blue}{\left(\mathsf{fma}\left(2, u1, \frac{1}{2}\right) \cdot \mathsf{PI}\left(\right)\right)}\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)}\right)}}} \]
    4. lift-*.f32N/A

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \color{blue}{\left(\mathsf{fma}\left(2, u1, \frac{1}{2}\right) \cdot \mathsf{PI}\left(\right)\right)}\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)}\right)}}} \]
    5. lift-PI.f3299.4

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \color{blue}{\pi}\right)\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)}\right)}}} \]
    6. lift-/.f32N/A

      \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, \frac{1}{2}\right) \cdot \mathsf{PI}\left(\right)\right)\right)}^{2}}}{alphay \cdot alphay} + \color{blue}{\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)}}\right)}}} \]
  6. Applied rewrites99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \color{blue}{\left(\frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}}}{alphay \cdot alphay} + \frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)}\right)}}}} \]
  7. Final simplification99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1 + \frac{1}{-1 - {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}}}{alphay \cdot alphay}\right)}}} \]
  8. Add Preprocessing

Alternative 3: 98.7% accurate, 3.7× speedup?

\[\begin{array}{l} \\ {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1}{alphay \cdot alphay}\right)}\right)}^{-0.5} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (pow
  (+
   1.0
   (/
    u0
    (*
     (- 1.0 u0)
     (+
      (/
       1.0
       (*
        alphax
        (fma
         alphax
         (pow (* (/ alphay alphax) (tan (* (fma 2.0 u1 0.5) PI))) 2.0)
         alphax)))
      (/ 1.0 (* alphay alphay))))))
  -0.5))
float code(float u0, float u1, float alphax, float alphay) {
	return powf((1.0f + (u0 / ((1.0f - u0) * ((1.0f / (alphax * fmaf(alphax, powf(((alphay / alphax) * tanf((fmaf(2.0f, u1, 0.5f) * ((float) M_PI)))), 2.0f), alphax))) + (1.0f / (alphay * alphay)))))), -0.5f);
}
function code(u0, u1, alphax, alphay)
	return Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(1.0) / Float32(alphax * fma(alphax, (Float32(Float32(alphay / alphax) * tan(Float32(fma(Float32(2.0), u1, Float32(0.5)) * Float32(pi)))) ^ Float32(2.0)), alphax))) + Float32(Float32(1.0) / Float32(alphay * alphay)))))) ^ Float32(-0.5)
end
\begin{array}{l}

\\
{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1}{alphay \cdot alphay}\right)}\right)}^{-0.5}
\end{array}
Derivation
  1. Initial program 99.4%

    \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
  2. Add Preprocessing
  3. Applied rewrites99.4%

    \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{\frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)}^{2}}}{alphax \cdot alphax} + \frac{1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)\right)}{\left(alphay \cdot alphay\right) \cdot 2}\right)}}}} \]
  4. Applied rewrites100.0%

    \[\leadsto \color{blue}{{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)} + \frac{1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}}}{alphay \cdot alphay}\right)}\right)}^{-0.5}} \]
  5. Taylor expanded in alphay around inf

    \[\leadsto {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)} + \frac{\color{blue}{1}}{alphay \cdot alphay}\right)}\right)}^{\frac{-1}{2}} \]
  6. Step-by-step derivation
    1. Applied rewrites99.3%

      \[\leadsto {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)} + \frac{\color{blue}{1}}{alphay \cdot alphay}\right)}\right)}^{-0.5} \]
    2. Step-by-step derivation
      1. lift-+.f32N/A

        \[\leadsto {\color{blue}{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)} + \frac{1}{alphay \cdot alphay}\right)}\right)}}^{\frac{-1}{2}} \]
      2. +-commutativeN/A

        \[\leadsto {\color{blue}{\left(\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{PI}\left(\right) \cdot \mathsf{fma}\left(2, u1, \frac{1}{2}\right)\right)\right)}^{2}\right)\right)} + \frac{1}{alphay \cdot alphay}\right)} + 1\right)}}^{\frac{-1}{2}} \]
      3. lower-+.f3299.3

        \[\leadsto {\color{blue}{\left(\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}\right)\right)} + \frac{1}{alphay \cdot alphay}\right)} + 1\right)}}^{-0.5} \]
    3. Applied rewrites99.3%

      \[\leadsto {\color{blue}{\left(\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1}{alphay \cdot alphay}\right)} + 1\right)}}^{-0.5} \]
    4. Final simplification99.3%

      \[\leadsto {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right)\right)}^{2}, alphax\right)} + \frac{1}{alphay \cdot alphay}\right)}\right)}^{-0.5} \]
    5. Add Preprocessing

    Alternative 4: 98.0% accurate, 6.2× speedup?

    \[\begin{array}{l} \\ e^{-0.5 \cdot \mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{1 - u0}\right)} \end{array} \]
    (FPCore (u0 u1 alphax alphay)
     :precision binary32
     (exp (* -0.5 (log1p (/ (* u0 (* alphay alphay)) (- 1.0 u0))))))
    float code(float u0, float u1, float alphax, float alphay) {
    	return expf((-0.5f * log1pf(((u0 * (alphay * alphay)) / (1.0f - u0)))));
    }
    
    function code(u0, u1, alphax, alphay)
    	return exp(Float32(Float32(-0.5) * log1p(Float32(Float32(u0 * Float32(alphay * alphay)) / Float32(Float32(1.0) - u0)))))
    end
    
    \begin{array}{l}
    
    \\
    e^{-0.5 \cdot \mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{1 - u0}\right)}
    \end{array}
    
    Derivation
    1. Initial program 99.4%

      \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
    2. Add Preprocessing
    3. Taylor expanded in alphay around 0

      \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{{alphay}^{2} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
    4. Step-by-step derivation
      1. lower-/.f32N/A

        \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{{alphay}^{2} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
      2. unpow2N/A

        \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{\left(alphay \cdot alphay\right)} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
      3. associate-*l*N/A

        \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{alphay \cdot \left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
      4. lower-*.f32N/A

        \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{alphay \cdot \left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
      5. lower-*.f32N/A

        \[\leadsto \frac{1}{\sqrt{1 + \frac{alphay \cdot \color{blue}{\left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
      6. lower-*.f32N/A

        \[\leadsto \frac{1}{\sqrt{1 + \frac{alphay \cdot \left(alphay \cdot u0\right)}{\color{blue}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
    5. Applied rewrites98.0%

      \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{alphay \cdot \left(alphay \cdot u0\right)}{{\sin \tan^{-1} \left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
    6. Applied rewrites98.4%

      \[\leadsto \color{blue}{e^{\mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{\left(1 - \frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\right)}^{2}}\right) \cdot \left(1 - u0\right)}\right) \cdot -0.5}} \]
    7. Taylor expanded in alphay around inf

      \[\leadsto e^{\mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{1 - \color{blue}{u0}}\right) \cdot \frac{-1}{2}} \]
    8. Step-by-step derivation
      1. Applied rewrites98.9%

        \[\leadsto e^{\mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{1 - \color{blue}{u0}}\right) \cdot -0.5} \]
      2. Final simplification98.9%

        \[\leadsto e^{-0.5 \cdot \mathsf{log1p}\left(\frac{u0 \cdot \left(alphay \cdot alphay\right)}{1 - u0}\right)} \]
      3. Add Preprocessing

      Alternative 5: 91.2% accurate, 1436.0× speedup?

      \[\begin{array}{l} \\ 1 \end{array} \]
      (FPCore (u0 u1 alphax alphay) :precision binary32 1.0)
      float code(float u0, float u1, float alphax, float alphay) {
      	return 1.0f;
      }
      
      real(4) function code(u0, u1, alphax, alphay)
          real(4), intent (in) :: u0
          real(4), intent (in) :: u1
          real(4), intent (in) :: alphax
          real(4), intent (in) :: alphay
          code = 1.0e0
      end function
      
      function code(u0, u1, alphax, alphay)
      	return Float32(1.0)
      end
      
      function tmp = code(u0, u1, alphax, alphay)
      	tmp = single(1.0);
      end
      
      \begin{array}{l}
      
      \\
      1
      \end{array}
      
      Derivation
      1. Initial program 99.4%

        \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
      2. Add Preprocessing
      3. Taylor expanded in alphay around 0

        \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{{alphay}^{2} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
      4. Step-by-step derivation
        1. lower-/.f32N/A

          \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{{alphay}^{2} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
        2. unpow2N/A

          \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{\left(alphay \cdot alphay\right)} \cdot u0}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
        3. associate-*l*N/A

          \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{alphay \cdot \left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
        4. lower-*.f32N/A

          \[\leadsto \frac{1}{\sqrt{1 + \frac{\color{blue}{alphay \cdot \left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
        5. lower-*.f32N/A

          \[\leadsto \frac{1}{\sqrt{1 + \frac{alphay \cdot \color{blue}{\left(alphay \cdot u0\right)}}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}} \]
        6. lower-*.f32N/A

          \[\leadsto \frac{1}{\sqrt{1 + \frac{alphay \cdot \left(alphay \cdot u0\right)}{\color{blue}{{\sin \tan^{-1} \left(\frac{alphay \cdot \tan \left(\frac{1}{2} \cdot \mathsf{PI}\left(\right) + 2 \cdot \left(u1 \cdot \mathsf{PI}\left(\right)\right)\right)}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
      5. Applied rewrites98.0%

        \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{alphay \cdot \left(alphay \cdot u0\right)}{{\sin \tan^{-1} \left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}}}} \]
      6. Taylor expanded in alphay around 0

        \[\leadsto \color{blue}{1} \]
      7. Step-by-step derivation
        1. Applied rewrites93.3%

          \[\leadsto \color{blue}{1} \]
        2. Add Preprocessing

        Reproduce

        ?
        herbie shell --seed 2024233 
        (FPCore (u0 u1 alphax alphay)
          :name "Trowbridge-Reitz Sample, sample surface normal, cosTheta"
          :precision binary32
          :pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 0.5))) (and (<= 0.0001 alphax) (<= alphax 1.0))) (and (<= 0.0001 alphay) (<= alphay 1.0)))
          (/ 1.0 (sqrt (+ 1.0 (/ (* (/ 1.0 (+ (/ (* (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphax alphax)) (/ (* (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphay alphay)))) u0) (- 1.0 u0))))))