
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0
(atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
(t_1 (sin t_0))
(t_2 (cos t_0)))
(/
1.0
(sqrt
(+
1.0
(/
(*
(/
1.0
(+
(/ (* t_2 t_2) (* alphax alphax))
(/ (* t_1 t_1) (* alphay alphay))))
u0)
(- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
float t_1 = sinf(t_0);
float t_2 = cosf(t_0);
return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay) t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi)))))) t_1 = sin(t_0) t_2 = cos(t_0) return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0))))) end
function tmp = code(u0, u1, alphax, alphay) t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi)))))); t_1 = sin(t_0); t_2 = cos(t_0); tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0)))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0
(atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
(t_1 (sin t_0))
(t_2 (cos t_0)))
(/
1.0
(sqrt
(+
1.0
(/
(*
(/
1.0
(+
(/ (* t_2 t_2) (* alphax alphax))
(/ (* t_1 t_1) (* alphay alphay))))
u0)
(- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
float t_1 = sinf(t_0);
float t_2 = cosf(t_0);
return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
function code(u0, u1, alphax, alphay) t_0 = atan(Float32(Float32(alphay / alphax) * tan(Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi)))))) t_1 = sin(t_0) t_2 = cos(t_0) return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))) * u0) / Float32(Float32(1.0) - u0))))) end
function tmp = code(u0, u1, alphax, alphay) t_0 = atan(((alphay / alphax) * tan((((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi)))))); t_1 = sin(t_0); t_2 = cos(t_0); tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (single(1.0) - u0)))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
\end{array}
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0 (tan (* PI (fma 2.0 u1 0.5)))))
(exp
(*
(log1p
(/
u0
(*
(+
(/ 1.0 (fma alphax alphax (pow (* alphay t_0) 2.0)))
(/
(+ 1.0 (/ 1.0 (- -1.0 (pow (* t_0 (/ alphay alphax)) 2.0))))
(* alphay alphay)))
(- 1.0 u0))))
-0.5))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f)));
return expf((log1pf((u0 / (((1.0f / fmaf(alphax, alphax, powf((alphay * t_0), 2.0f))) + ((1.0f + (1.0f / (-1.0f - powf((t_0 * (alphay / alphax)), 2.0f)))) / (alphay * alphay))) * (1.0f - u0)))) * -0.5f));
}
function code(u0, u1, alphax, alphay) t_0 = tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) return exp(Float32(log1p(Float32(u0 / Float32(Float32(Float32(Float32(1.0) / fma(alphax, alphax, (Float32(alphay * t_0) ^ Float32(2.0)))) + Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - (Float32(t_0 * Float32(alphay / alphax)) ^ Float32(2.0))))) / Float32(alphay * alphay))) * Float32(Float32(1.0) - u0)))) * Float32(-0.5))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\\
e^{\mathsf{log1p}\left(\frac{u0}{\left(\frac{1}{\mathsf{fma}\left(alphax, alphax, {\left(alphay \cdot t\_0\right)}^{2}\right)} + \frac{1 + \frac{1}{-1 - {\left(t\_0 \cdot \frac{alphay}{alphax}\right)}^{2}}}{alphay \cdot alphay}\right) \cdot \left(1 - u0\right)}\right) \cdot -0.5}
\end{array}
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Applied egg-rr100.0%
*-commutativeN/A
distribute-lft-inN/A
metadata-evalN/A
div-invN/A
/-rgt-identityN/A
accelerator-lowering-fma.f32N/A
pow2N/A
pow-prod-downN/A
pow-lowering-pow.f32N/A
Applied egg-rr100.0%
*-commutativeN/A
associate-*l/N/A
div-invN/A
associate-*l*N/A
inv-powN/A
pow-plusN/A
metadata-evalN/A
metadata-evalN/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
tan-lowering-tan.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
accelerator-lowering-fma.f32100.0
Applied egg-rr100.0%
Final simplification100.0%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0 (tan (* PI (fma 2.0 u1 0.5)))))
(pow
(+
1.0
(/
u0
(*
(- 1.0 u0)
(+
(/ 1.0 (fma alphax alphax (pow (* alphay t_0) 2.0)))
(/
(+ 1.0 (/ -1.0 (+ 1.0 (pow (* alphay (/ t_0 alphax)) 2.0))))
(* alphay alphay))))))
-0.5)))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f)));
return powf((1.0f + (u0 / ((1.0f - u0) * ((1.0f / fmaf(alphax, alphax, powf((alphay * t_0), 2.0f))) + ((1.0f + (-1.0f / (1.0f + powf((alphay * (t_0 / alphax)), 2.0f)))) / (alphay * alphay)))))), -0.5f);
}
function code(u0, u1, alphax, alphay) t_0 = tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) return Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(1.0) / fma(alphax, alphax, (Float32(alphay * t_0) ^ Float32(2.0)))) + Float32(Float32(Float32(1.0) + Float32(Float32(-1.0) / Float32(Float32(1.0) + (Float32(alphay * Float32(t_0 / alphax)) ^ Float32(2.0))))) / Float32(alphay * alphay)))))) ^ Float32(-0.5) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)\\
{\left(1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{\mathsf{fma}\left(alphax, alphax, {\left(alphay \cdot t\_0\right)}^{2}\right)} + \frac{1 + \frac{-1}{1 + {\left(alphay \cdot \frac{t\_0}{alphax}\right)}^{2}}}{alphay \cdot alphay}\right)}\right)}^{-0.5}
\end{array}
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Applied egg-rr100.0%
*-commutativeN/A
distribute-lft-inN/A
metadata-evalN/A
div-invN/A
/-rgt-identityN/A
accelerator-lowering-fma.f32N/A
pow2N/A
pow-prod-downN/A
pow-lowering-pow.f32N/A
Applied egg-rr100.0%
Applied egg-rr99.9%
Final simplification99.9%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0 (pow (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax)) 2.0)))
(/
1.0
(sqrt
(+
1.0
(/
u0
(*
(- 1.0 u0)
(+
(/ (+ 1.0 (/ 1.0 (- -1.0 t_0))) (* alphay alphay))
(/ 1.0 (* (+ 1.0 t_0) (* alphax alphax)))))))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = powf((tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax)), 2.0f);
return 1.0f / sqrtf((1.0f + (u0 / ((1.0f - u0) * (((1.0f + (1.0f / (-1.0f - t_0))) / (alphay * alphay)) + (1.0f / ((1.0f + t_0) * (alphax * alphax))))))));
}
function code(u0, u1, alphax, alphay) t_0 = Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax)) ^ Float32(2.0) return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - t_0))) / Float32(alphay * alphay)) + Float32(Float32(1.0) / Float32(Float32(Float32(1.0) + t_0) * Float32(alphax * alphax))))))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := {\left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2}\\
\frac{1}{\sqrt{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1 + \frac{1}{-1 - t\_0}}{alphay \cdot alphay} + \frac{1}{\left(1 + t\_0\right) \cdot \left(alphax \cdot alphax\right)}\right)}}}
\end{array}
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Applied egg-rr99.4%
Final simplification99.4%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(let* ((t_0 (* PI (fma 2.0 u1 0.5))))
(sqrt
(/
1.0
(+
1.0
(/
u0
(*
(- 1.0 u0)
(+
(/ 1.0 (* alphay alphay))
(/
(pow (cos t_0) 2.0)
(* (* alphay alphay) (pow (sin t_0) 2.0)))))))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = ((float) M_PI) * fmaf(2.0f, u1, 0.5f);
return sqrtf((1.0f / (1.0f + (u0 / ((1.0f - u0) * ((1.0f / (alphay * alphay)) + (powf(cosf(t_0), 2.0f) / ((alphay * alphay) * powf(sinf(t_0), 2.0f)))))))));
}
function code(u0, u1, alphax, alphay) t_0 = Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5))) return sqrt(Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(u0 / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(Float32(1.0) / Float32(alphay * alphay)) + Float32((cos(t_0) ^ Float32(2.0)) / Float32(Float32(alphay * alphay) * (sin(t_0) ^ Float32(2.0)))))))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\\
\sqrt{\frac{1}{1 + \frac{u0}{\left(1 - u0\right) \cdot \left(\frac{1}{alphay \cdot alphay} + \frac{{\cos t\_0}^{2}}{\left(alphay \cdot alphay\right) \cdot {\sin t\_0}^{2}}\right)}}}
\end{array}
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Applied egg-rr100.0%
Taylor expanded in alphax around 0
sqrt-lowering-sqrt.f32N/A
/-lowering-/.f32N/A
+-lowering-+.f32N/A
/-lowering-/.f32N/A
Simplified98.9%
Final simplification98.9%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(sqrt
(/
1.0
(fma
2.0
(/
(* u0 (* alphay alphay))
(*
(- 1.0 u0)
(-
1.0
(cos
(* 2.0 (atan (/ (* alphay (tan (* PI (fma 2.0 u1 0.5)))) alphax)))))))
1.0))))
float code(float u0, float u1, float alphax, float alphay) {
return sqrtf((1.0f / fmaf(2.0f, ((u0 * (alphay * alphay)) / ((1.0f - u0) * (1.0f - cosf((2.0f * atanf(((alphay * tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f)))) / alphax))))))), 1.0f)));
}
function code(u0, u1, alphax, alphay) return sqrt(Float32(Float32(1.0) / fma(Float32(2.0), Float32(Float32(u0 * Float32(alphay * alphay)) / Float32(Float32(Float32(1.0) - u0) * Float32(Float32(1.0) - cos(Float32(Float32(2.0) * atan(Float32(Float32(alphay * tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5))))) / alphax))))))), Float32(1.0)))) end
\begin{array}{l}
\\
\sqrt{\frac{1}{\mathsf{fma}\left(2, \frac{u0 \cdot \left(alphay \cdot alphay\right)}{\left(1 - u0\right) \cdot \left(1 - \cos \left(2 \cdot \tan^{-1} \left(\frac{alphay \cdot \tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right)}{alphax}\right)\right)\right)}, 1\right)}}
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Taylor expanded in alphax around inf
Simplified98.4%
Final simplification98.4%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(pow
(fma
(* alphay alphay)
(/
u0
(*
(+
1.0
(/
1.0
(- -1.0 (pow (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax)) 2.0))))
(- 1.0 u0)))
1.0)
-0.5))
float code(float u0, float u1, float alphax, float alphay) {
return powf(fmaf((alphay * alphay), (u0 / ((1.0f + (1.0f / (-1.0f - powf((tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax)), 2.0f)))) * (1.0f - u0))), 1.0f), -0.5f);
}
function code(u0, u1, alphax, alphay) return fma(Float32(alphay * alphay), Float32(u0 / Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - (Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax)) ^ Float32(2.0))))) * Float32(Float32(1.0) - u0))), Float32(1.0)) ^ Float32(-0.5) end
\begin{array}{l}
\\
{\left(\mathsf{fma}\left(alphay \cdot alphay, \frac{u0}{\left(1 + \frac{1}{-1 - {\left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2}}\right) \cdot \left(1 - u0\right)}, 1\right)\right)}^{-0.5}
\end{array}
Initial program 99.4%
Taylor expanded in alphay around 0
/-lowering-/.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
Simplified98.0%
Applied egg-rr98.4%
Final simplification98.4%
(FPCore (u0 u1 alphax alphay)
:precision binary32
(/
1.0
(sqrt
(fma
(/
u0
(*
(+
1.0
(/
1.0
(-
-1.0
(pow (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax)) 2.0))))
(- 1.0 u0)))
(* alphay alphay)
1.0))))
float code(float u0, float u1, float alphax, float alphay) {
return 1.0f / sqrtf(fmaf((u0 / ((1.0f + (1.0f / (-1.0f - powf((tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax)), 2.0f)))) * (1.0f - u0))), (alphay * alphay), 1.0f));
}
function code(u0, u1, alphax, alphay) return Float32(Float32(1.0) / sqrt(fma(Float32(u0 / Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / Float32(Float32(-1.0) - (Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax)) ^ Float32(2.0))))) * Float32(Float32(1.0) - u0))), Float32(alphay * alphay), Float32(1.0)))) end
\begin{array}{l}
\\
\frac{1}{\sqrt{\mathsf{fma}\left(\frac{u0}{\left(1 + \frac{1}{-1 - {\left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)}^{2}}\right) \cdot \left(1 - u0\right)}, alphay \cdot alphay, 1\right)}}
\end{array}
Initial program 99.4%
Taylor expanded in alphay around 0
/-lowering-/.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
Simplified98.0%
Applied egg-rr98.0%
Final simplification98.0%
(FPCore (u0 u1 alphax alphay) :precision binary32 1.0)
float code(float u0, float u1, float alphax, float alphay) {
return 1.0f;
}
real(4) function code(u0, u1, alphax, alphay)
real(4), intent (in) :: u0
real(4), intent (in) :: u1
real(4), intent (in) :: alphax
real(4), intent (in) :: alphay
code = 1.0e0
end function
function code(u0, u1, alphax, alphay) return Float32(1.0) end
function tmp = code(u0, u1, alphax, alphay) tmp = single(1.0); end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.4%
Applied egg-rr99.4%
Taylor expanded in u0 around 0
Simplified92.8%
herbie shell --seed 2024199
(FPCore (u0 u1 alphax alphay)
:name "Trowbridge-Reitz Sample, sample surface normal, cosTheta"
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 0.5))) (and (<= 0.0001 alphax) (<= alphax 1.0))) (and (<= 0.0001 alphay) (<= alphay 1.0)))
(/ 1.0 (sqrt (+ 1.0 (/ (* (/ 1.0 (+ (/ (* (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphax alphax)) (/ (* (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphay alphay)))) u0) (- 1.0 u0))))))