Trowbridge-Reitz Sample, sample surface normal, cosTheta

Percentage Accurate: 99.4% → 99.9%
Time: 23.8s
Alternatives: 11
Speedup: 2.0×

Specification

?
\[\left(\left(\left(2.328306437 \cdot 10^{-10} \leq u0 \land u0 \leq 1\right) \land \left(2.328306437 \cdot 10^{-10} \leq u1 \land u1 \leq 0.5\right)\right) \land \left(0.0001 \leq alphax \land alphax \leq 1\right)\right) \land \left(0.0001 \leq alphay \land alphay \leq 1\right)\]
\[\begin{array}{l} \\ \begin{array}{l} t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\ t_1 := \sin t\_0\\ t_2 := \cos t\_0\\ \frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0
         (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
        (t_1 (sin t_0))
        (t_2 (cos t_0)))
   (/
    1.0
    (sqrt
     (+
      1.0
      (/
       (*
        (/
         1.0
         (+
          (/ (* t_2 t_2) (* alphax alphax))
          (/ (* t_1 t_1) (* alphay alphay))))
        u0)
       (- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
	float t_1 = sinf(t_0);
	float t_2 = cosf(t_0);
	return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay)
	t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi))))))
	t_1 = sin(t_0)
	t_2 = cos(t_0)
	return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0)))))
end
function tmp = code(u0, u1, alphax, alphay)
	t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi))))));
	t_1 = sin(t_0);
	t_2 = cos(t_0);
	tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}

Sampling outcomes in binary32 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 11 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 99.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\ t_1 := \sin t\_0\\ t_2 := \cos t\_0\\ \frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0
         (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
        (t_1 (sin t_0))
        (t_2 (cos t_0)))
   (/
    1.0
    (sqrt
     (+
      1.0
      (/
       (*
        (/
         1.0
         (+
          (/ (* t_2 t_2) (* alphax alphax))
          (/ (* t_1 t_1) (* alphay alphay))))
        u0)
       (- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
	float t_1 = sinf(t_0);
	float t_2 = cosf(t_0);
	return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay)
	t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi))))))
	t_1 = sin(t_0)
	t_2 = cos(t_0)
	return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0)))))
end
function tmp = code(u0, u1, alphax, alphay)
	t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi))))));
	t_1 = sin(t_0);
	t_2 = cos(t_0);
	tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}

Alternative 1: 99.9% accurate, 1.7× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\\ e^{\mathsf{log1p}\left(\frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} t\_0\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {t\_0}^{2}\right)\right)}\right)}\right) \cdot -0.5} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0 (/ (* alphay (tan (* PI (fma 2.0 u1 0.5)))) alphax)))
   (exp
    (*
     (log1p
      (/
       u0
       (*
        (- 1.0 u0)
        (fma
         (- 1.0 (cos (* 2.0 (atan t_0))))
         (/ 0.5 (* alphay alphay))
         (/ 1.0 (* alphax (* alphax (+ 1.0 (pow t_0 2.0)))))))))
     -0.5))))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = (alphay * tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f)))) / alphax;
	return expf((log1pf((u0 / ((1.0f - u0) * fmaf((1.0f - cosf((2.0f * atanf(t_0)))), (0.5f / (alphay * alphay)), (1.0f / (alphax * (alphax * (1.0f + powf(t_0, 2.0f))))))))) * -0.5f));
}
function code(u0, u1, alphax, alphay)
	t_0 = Float32(Float32(alphay * tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5))))) / alphax)
	return exp(Float32(log1p(Float32(u0 / Float32(Float32(Float32(1.0) - u0) * fma(Float32(Float32(1.0) - cos(Float32(Float32(2.0) * atan(t_0)))), Float32(Float32(0.5) / Float32(alphay * alphay)), Float32(Float32(1.0) / Float32(alphax * Float32(alphax * Float32(Float32(1.0) + (t_0 ^ Float32(2.0)))))))))) * Float32(-0.5)))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\\
e^{\mathsf{log1p}\left(\frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} t\_0\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {t\_0}^{2}\right)\right)}\right)}\right) \cdot -0.5}
\end{array}
\end{array}
Derivation
  1. Initial program 99.4%

    \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
  2. Add Preprocessing
  3. Applied rewrites99.3%

    \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{\frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)}^{2}}}{alphax \cdot alphax} + \frac{1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)\right)}{\left(alphay \cdot alphay\right) \cdot 2}\right)}}}} \]
  4. Applied rewrites99.9%

    \[\leadsto \color{blue}{e^{\mathsf{log1p}\left(\frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\right)\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\right)}^{2}\right)\right)}\right)}\right) \cdot -0.5}} \]
  5. Add Preprocessing

Alternative 2: 99.8% accurate, 2.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\\ {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} t\_0\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {t\_0}^{2}, alphax\right)}\right)}\right)}^{-0.5} \end{array} \end{array} \]
(FPCore (u0 u1 alphax alphay)
 :precision binary32
 (let* ((t_0 (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax))))
   (pow
    (+
     1.0
     (/
      u0
      (*
       (- 1.0 u0)
       (fma
        (- 1.0 (cos (* 2.0 (atan t_0))))
        (/ 0.5 (* alphay alphay))
        (/ 1.0 (* alphax (fma alphax (pow t_0 2.0) alphax)))))))
    -0.5)))
float code(float u0, float u1, float alphax, float alphay) {
	float t_0 = tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax);
	return powf((1.0f + (u0 / ((1.0f - u0) * fmaf((1.0f - cosf((2.0f * atanf(t_0)))), (0.5f / (alphay * alphay)), (1.0f / (alphax * fmaf(alphax, powf(t_0, 2.0f), alphax))))))), -0.5f);
}
function code(u0, u1, alphax, alphay)
	t_0 = Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax))
	return Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * fma(Float32(Float32(1.0) - cos(Float32(Float32(2.0) * atan(t_0)))), Float32(Float32(0.5) / Float32(alphay * alphay)), Float32(Float32(1.0) / Float32(alphax * fma(alphax, (t_0 ^ Float32(2.0)), alphax))))))) ^ Float32(-0.5)
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\\
{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} t\_0\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {t\_0}^{2}, alphax\right)}\right)}\right)}^{-0.5}
\end{array}
\end{array}
Derivation
  1. Initial program 99.4%

    \[\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{\cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \cos \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphax \cdot alphax} + \frac{\sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right) \cdot \sin \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)}{alphay \cdot alphay}} \cdot u0}{1 - u0}}} \]
  2. Add Preprocessing
  3. Applied rewrites99.3%

    \[\leadsto \frac{1}{\sqrt{1 + \color{blue}{\frac{u0}{\left(1 - u0\right) \cdot \left(\frac{\frac{1}{1 + {\left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)}^{2}}}{alphax \cdot alphax} + \frac{1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\mathsf{fma}\left(2, \pi \cdot u1, \pi \cdot 0.5\right)\right)\right)\right)}{\left(alphay \cdot alphay\right) \cdot 2}\right)}}}} \]
  4. Applied rewrites99.8%

    \[\leadsto \color{blue}{{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\right)\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \left(alphax \cdot \left(1 + {\left(\frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\right)}^{2}\right)\right)}\right)}\right)}^{-0.5}} \]
  5. Applied rewrites99.8%

    \[\leadsto {\color{blue}{\left(\frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} \left(\tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right) \cdot \frac{alphay}{alphax}\right)\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\tan \left(\mathsf{fma}\left(2, u1, 0.5\right) \cdot \pi\right) \cdot \frac{alphay}{alphax}\right)}^{2}, alphax\right)}\right)} + 1\right)}}^{-0.5} \]
  6. Final simplification99.8%

    \[\leadsto {\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \mathsf{fma}\left(1 - \cos \left(2 \cdot \tan^{-1} \left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)\right), \frac{0.5}{alphay \cdot alphay}, \frac{1}{alphax \cdot \mathsf{fma}\left(alphax, {\left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2}, alphax\right)}\right)}\right)}^{-0.5} \]
  7. Add Preprocessing

Reproduce

?
herbie shell --seed 2024230 
(FPCore (u0 u1 alphax alphay)
  :name "Trowbridge-Reitz Sample, sample surface normal, cosTheta"
  :precision binary32
  :pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 0.5))) (and (<= 0.0001 alphax) (<= alphax 1.0))) (and (<= 0.0001 alphay) (<= alphay 1.0)))
  (/ 1.0 (sqrt (+ 1.0 (/ (* (/ 1.0 (+ (/ (* (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphax alphax)) (/ (* (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphay alphay)))) u0) (- 1.0 u0))))))