
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(let* ((t_0
(atan
(*
(/ alphay alphax)
(tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
(t_1 (sin t_0))
(t_2 (cos t_0)))
(/
1.0
(sqrt
(+
1.0
(/
(*
(/
1.0
(+
(/ (* t_2 t_2) (* alphax alphax))
(/ (* t_1 t_1) (* alphay alphay))))
u0)
(- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
float t_1 = sinf(t_0);
float t_2 = cosf(t_0);
return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
# Evaluates
#   1 / sqrt(1 + ((1 / (cos(t)^2 / alphax^2 + sin(t)^2 / alphay^2)) * u0) / (1 - u0))
# where t = atan((alphay / alphax) * tan(2*pi*u1 + 0.5*pi)).
#
# Every arithmetic result is passed through Float32(...) so that each step is
# rounded to single precision. The arguments are presumably Float32 values
# already; nothing in this function enforces that.
function code(u0, u1, alphax, alphay)
    # Argument of the tangent: 2*pi*u1 + 0.5*pi.
    phi = Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi)))
    t_0 = atan(Float32(Float32(alphay / alphax) * tan(phi)))
    t_1 = sin(t_0)
    t_2 = cos(t_0)
    # cos^2 / alphax^2 + sin^2 / alphay^2
    denom = Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))
    # ((1 / denom) * u0) / (1 - u0); the divisor is zero when u0 == 1.
    ratio = Float32(Float32(Float32(Float32(1.0) / denom) * u0) / Float32(Float32(1.0) - u0))
    return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + ratio)))
end
function tmp = code(u0, u1, alphax, alphay)
    % Evaluates
    %   1 / sqrt(1 + ((1 / (cos(t)^2/alphax^2 + sin(t)^2/alphay^2)) * u0) / (1 - u0))
    % with t = atan((alphay / alphax) * tan(2*pi*u1 + 0.5*pi)).
    % Constants are created with single(...); the inputs are presumably
    % single as well (not checked here).
    phi = ((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi));
    t_0 = atan((alphay / alphax) * tan(phi));
    sin_t = sin(t_0);
    cos_t = cos(t_0);
    % cos^2 / alphax^2 + sin^2 / alphay^2
    inv_sum = ((cos_t * cos_t) / (alphax * alphax)) + ((sin_t * sin_t) / (alphay * alphay));
    tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / inv_sum) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(let* ((t_0
(atan
(*
(/ alphay alphax)
(tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))
(t_1 (sin t_0))
(t_2 (cos t_0)))
(/
1.0
(sqrt
(+
1.0
(/
(*
(/
1.0
(+
(/ (* t_2 t_2) (* alphax alphax))
(/ (* t_1 t_1) (* alphay alphay))))
u0)
(- 1.0 u0)))))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = atanf(((alphay / alphax) * tanf((((2.0f * ((float) M_PI)) * u1) + (0.5f * ((float) M_PI))))));
float t_1 = sinf(t_0);
float t_2 = cosf(t_0);
return 1.0f / sqrtf((1.0f + (((1.0f / (((t_2 * t_2) / (alphax * alphax)) + ((t_1 * t_1) / (alphay * alphay)))) * u0) / (1.0f - u0))));
}
# Evaluates
#   1 / sqrt(1 + ((1 / (cos(t)^2 / alphax^2 + sin(t)^2 / alphay^2)) * u0) / (1 - u0))
# where t = atan((alphay / alphax) * tan(2*pi*u1 + 0.5*pi)).
#
# Every arithmetic result is passed through Float32(...) so that each step is
# rounded to single precision. The arguments are presumably Float32 values
# already; nothing in this function enforces that.
function code(u0, u1, alphax, alphay)
    # Argument of the tangent: 2*pi*u1 + 0.5*pi.
    phi = Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * u1) + Float32(Float32(0.5) * Float32(pi)))
    t_0 = atan(Float32(Float32(alphay / alphax) * tan(phi)))
    t_1 = sin(t_0)
    t_2 = cos(t_0)
    # cos^2 / alphax^2 + sin^2 / alphay^2
    denom = Float32(Float32(Float32(t_2 * t_2) / Float32(alphax * alphax)) + Float32(Float32(t_1 * t_1) / Float32(alphay * alphay)))
    # ((1 / denom) * u0) / (1 - u0); the divisor is zero when u0 == 1.
    ratio = Float32(Float32(Float32(Float32(1.0) / denom) * u0) / Float32(Float32(1.0) - u0))
    return Float32(Float32(1.0) / sqrt(Float32(Float32(1.0) + ratio)))
end
function tmp = code(u0, u1, alphax, alphay)
    % Evaluates
    %   1 / sqrt(1 + ((1 / (cos(t)^2/alphax^2 + sin(t)^2/alphay^2)) * u0) / (1 - u0))
    % with t = atan((alphay / alphax) * tan(2*pi*u1 + 0.5*pi)).
    % Constants are created with single(...); the inputs are presumably
    % single as well (not checked here).
    phi = ((single(2.0) * single(pi)) * u1) + (single(0.5) * single(pi));
    t_0 = atan((alphay / alphax) * tan(phi));
    sin_t = sin(t_0);
    cos_t = cos(t_0);
    % cos^2 / alphax^2 + sin^2 / alphay^2
    inv_sum = ((cos_t * cos_t) / (alphax * alphax)) + ((sin_t * sin_t) / (alphay * alphay));
    tmp = single(1.0) / sqrt((single(1.0) + (((single(1.0) / inv_sum) * u0) / (single(1.0) - u0))));
end
\begin{array}{l}
t_0 := \tan^{-1} \left(\frac{alphay}{alphax} \cdot \tan \left(\left(2 \cdot \pi\right) \cdot u1 + 0.5 \cdot \pi\right)\right)\\
t_1 := \sin t\_0\\
t_2 := \cos t\_0\\
\frac{1}{\sqrt{1 + \frac{\frac{1}{\frac{t\_2 \cdot t\_2}{alphax \cdot alphax} + \frac{t\_1 \cdot t\_1}{alphay \cdot alphay}} \cdot u0}{1 - u0}}}
\end{array}
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(let* ((t_0
(asinh (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax)))))
(pow
(-
(/
u0
(*
(- 1.0 u0)
(+
(pow (/ (tanh t_0) alphay) 2.0)
(/ (pow (cosh t_0) -2.0) (* alphax alphax)))))
-1.0)
-0.5)))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = asinhf((tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax)));
return powf(((u0 / ((1.0f - u0) * (powf((tanhf(t_0) / alphay), 2.0f) + (powf(coshf(t_0), -2.0f) / (alphax * alphax))))) - -1.0f), -0.5f);
}
# Evaluates
#   (u0 / ((1 - u0) * ((tanh(t) / alphay)^2 + cosh(t)^-2 / alphax^2)) - -1)^-0.5
# where t = asinh(tan(pi * fma(2, u1, 0.5)) * (alphay / alphax)).
#
# Arithmetic results are passed through Float32(...) so each step is rounded
# to single precision. The arguments are presumably Float32 values already;
# nothing in this function enforces that.
function code(u0, u1, alphax, alphay)
    t_0 = asinh(Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax)))
    # (tanh(t_0) / alphay)^2
    tanh_term = Float32(tanh(t_0) / alphay) ^ Float32(2.0)
    # cosh(t_0)^-2 / alphax^2
    cosh_term = Float32((cosh(t_0) ^ Float32(-2.0)) / Float32(alphax * alphax))
    # (1 - u0) * (tanh_term + cosh_term); this is zero when u0 == 1.
    scaled = Float32(Float32(Float32(1.0) - u0) * Float32(tanh_term + cosh_term))
    # "- Float32(-1.0)" is kept as written in the source expression.
    return Float32(Float32(u0 / scaled) - Float32(-1.0)) ^ Float32(-0.5)
end
\begin{array}{l}
t_0 := \sinh^{-1} \left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)\\
{\left(\frac{u0}{\left(1 - u0\right) \cdot \left({\left(\frac{\tanh t\_0}{alphay}\right)}^{2} + \frac{{\cosh t\_0}^{-2}}{alphax \cdot alphax}\right)} - -1\right)}^{-0.5}
\end{array}
Initial program 99.4%
Applied rewrites 99.9%
Applied rewrites 99.9%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(let* ((t_0
(asinh (* (tan (* PI (fma 2.0 u1 0.5))) (/ alphay alphax)))))
(/
1.0
(sqrt
(-
(/
u0
(*
(- 1.0 u0)
(+
(pow (/ (tanh t_0) alphay) 2.0)
(/ (pow (cosh t_0) -2.0) (* alphax alphax)))))
-1.0)))))
float code(float u0, float u1, float alphax, float alphay) {
float t_0 = asinhf((tanf((((float) M_PI) * fmaf(2.0f, u1, 0.5f))) * (alphay / alphax)));
return 1.0f / sqrtf(((u0 / ((1.0f - u0) * (powf((tanhf(t_0) / alphay), 2.0f) + (powf(coshf(t_0), -2.0f) / (alphax * alphax))))) - -1.0f));
}
# Evaluates
#   1 / sqrt(u0 / ((1 - u0) * ((tanh(t) / alphay)^2 + cosh(t)^-2 / alphax^2)) - -1)
# where t = asinh(tan(pi * fma(2, u1, 0.5)) * (alphay / alphax)).
#
# Arithmetic results are passed through Float32(...) so each step is rounded
# to single precision. The arguments are presumably Float32 values already;
# nothing in this function enforces that.
function code(u0, u1, alphax, alphay)
    t_0 = asinh(Float32(tan(Float32(Float32(pi) * fma(Float32(2.0), u1, Float32(0.5)))) * Float32(alphay / alphax)))
    # (tanh(t_0) / alphay)^2
    tanh_term = Float32(tanh(t_0) / alphay) ^ Float32(2.0)
    # cosh(t_0)^-2 / alphax^2
    cosh_term = Float32((cosh(t_0) ^ Float32(-2.0)) / Float32(alphax * alphax))
    # (1 - u0) * (tanh_term + cosh_term); this is zero when u0 == 1.
    scaled = Float32(Float32(Float32(1.0) - u0) * Float32(tanh_term + cosh_term))
    # "- Float32(-1.0)" is kept as written in the source expression.
    return Float32(Float32(1.0) / sqrt(Float32(Float32(u0 / scaled) - Float32(-1.0))))
end
\begin{array}{l}
t_0 := \sinh^{-1} \left(\tan \left(\pi \cdot \mathsf{fma}\left(2, u1, 0.5\right)\right) \cdot \frac{alphay}{alphax}\right)\\
\frac{1}{\sqrt{\frac{u0}{\left(1 - u0\right) \cdot \left({\left(\frac{\tanh t\_0}{alphay}\right)}^{2} + \frac{{\cosh t\_0}^{-2}}{alphax \cdot alphax}\right)} - -1}}
\end{array}
Initial program 99.4%
Applied rewrites 99.4%
Applied rewrites 99.4%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(pow
(-
(/
(* (* alphay alphay) u0)
(*
(pow
(tanh
(asinh (* (tan (* (fma u1 2.0 0.5) PI)) (/ alphay alphax))))
2.0)
(- 1.0 u0)))
-1.0)
-0.5))
float code(float u0, float u1, float alphax, float alphay) {
return powf(((((alphay * alphay) * u0) / (powf(tanhf(asinhf((tanf((fmaf(u1, 2.0f, 0.5f) * ((float) M_PI))) * (alphay / alphax)))), 2.0f) * (1.0f - u0))) - -1.0f), -0.5f);
}
# Evaluates
#   ((alphay^2 * u0) / (tanh(asinh(x))^2 * (1 - u0)) - -1)^-0.5
# where x = tan(fma(u1, 2, 0.5) * pi) * (alphay / alphax).
#
# Arithmetic results are passed through Float32(...) so each step is rounded
# to single precision.
function code(u0, u1, alphax, alphay)
    angle = Float32(fma(u1, Float32(2.0), Float32(0.5)) * Float32(pi))
    slope = Float32(tan(angle) * Float32(alphay / alphax))
    numer = Float32(Float32(alphay * alphay) * u0)
    # tanh(asinh(slope))^2 * (1 - u0)
    denom = Float32((tanh(asinh(slope)) ^ Float32(2.0)) * Float32(Float32(1.0) - u0))
    return Float32(Float32(numer / denom) - Float32(-1.0)) ^ Float32(-0.5)
end
{\left(\frac{\left(alphay \cdot alphay\right) \cdot u0}{{\tanh \sinh^{-1} \left(\tan \left(\mathsf{fma}\left(u1, 2, 0.5\right) \cdot \pi\right) \cdot \frac{alphay}{alphax}\right)}^{2} \cdot \left(1 - u0\right)} - -1\right)}^{-0.5}
Initial program 99.4%
Taylor expanded in alphax around inf
Applied rewrites 97.7%
Applied rewrites 98.1%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(/
1.0
(sqrt
(-
(/
(* (* alphay alphay) u0)
(*
(pow
(tanh
(asinh (* (tan (* (fma u1 2.0 0.5) PI)) (/ alphay alphax))))
2.0)
(- 1.0 u0)))
-1.0))))
float code(float u0, float u1, float alphax, float alphay) {
return 1.0f / sqrtf(((((alphay * alphay) * u0) / (powf(tanhf(asinhf((tanf((fmaf(u1, 2.0f, 0.5f) * ((float) M_PI))) * (alphay / alphax)))), 2.0f) * (1.0f - u0))) - -1.0f));
}
# Evaluates
#   1 / sqrt((alphay^2 * u0) / (tanh(asinh(x))^2 * (1 - u0)) - -1)
# where x = tan(fma(u1, 2, 0.5) * pi) * (alphay / alphax).
#
# Arithmetic results are passed through Float32(...) so each step is rounded
# to single precision.
function code(u0, u1, alphax, alphay)
    angle = Float32(fma(u1, Float32(2.0), Float32(0.5)) * Float32(pi))
    slope = Float32(tan(angle) * Float32(alphay / alphax))
    numer = Float32(Float32(alphay * alphay) * u0)
    # tanh(asinh(slope))^2 * (1 - u0)
    denom = Float32((tanh(asinh(slope)) ^ Float32(2.0)) * Float32(Float32(1.0) - u0))
    return Float32(Float32(1.0) / sqrt(Float32(Float32(numer / denom) - Float32(-1.0))))
end
\frac{1}{\sqrt{\frac{\left(alphay \cdot alphay\right) \cdot u0}{{\tanh \sinh^{-1} \left(\tan \left(\mathsf{fma}\left(u1, 2, 0.5\right) \cdot \pi\right) \cdot \frac{alphay}{alphax}\right)}^{2} \cdot \left(1 - u0\right)} - -1}}
Initial program 99.4%
Taylor expanded in alphax around inf
Applied rewrites 97.7%
Applied rewrites 97.7%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(fma
(/
(* (* alphay alphay) u0)
(*
(pow
(tanh (asinh (* (tan (* (fma u1 2.0 0.5) PI)) (/ alphay alphax))))
2.0)
(- 1.0 u0)))
-0.5
1.0))
float code(float u0, float u1, float alphax, float alphay) {
return fmaf((((alphay * alphay) * u0) / (powf(tanhf(asinhf((tanf((fmaf(u1, 2.0f, 0.5f) * ((float) M_PI))) * (alphay / alphax)))), 2.0f) * (1.0f - u0))), -0.5f, 1.0f);
}
# Evaluates
#   fma((alphay^2 * u0) / (tanh(asinh(x))^2 * (1 - u0)), -0.5, 1)
# where x = tan(fma(u1, 2, 0.5) * pi) * (alphay / alphax).
#
# Arithmetic results are passed through Float32(...) so each step is rounded
# to single precision.
function code(u0, u1, alphax, alphay)
    angle = Float32(fma(u1, Float32(2.0), Float32(0.5)) * Float32(pi))
    slope = Float32(tan(angle) * Float32(alphay / alphax))
    numer = Float32(Float32(alphay * alphay) * u0)
    # tanh(asinh(slope))^2 * (1 - u0)
    denom = Float32((tanh(asinh(slope)) ^ Float32(2.0)) * Float32(Float32(1.0) - u0))
    return fma(Float32(numer / denom), Float32(-0.5), Float32(1.0))
end
\mathsf{fma}\left(\frac{\left(alphay \cdot alphay\right) \cdot u0}{{\tanh \sinh^{-1} \left(\tan \left(\mathsf{fma}\left(u1, 2, 0.5\right) \cdot \pi\right) \cdot \frac{alphay}{alphax}\right)}^{2} \cdot \left(1 - u0\right)}, -0.5, 1\right)
Initial program 99.4%
Taylor expanded in alphax around 0
Applied rewrites 42.1%
Taylor expanded in alphay around 0
Applied rewrites 96.3%
Applied rewrites 96.3%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(pow (/ (- 1.0 u0) (- 1.0 u0)) -0.5))
float code(float u0, float u1, float alphax, float alphay) {
return powf(((1.0f - u0) / (1.0f - u0)), -0.5f);
}
! Evaluates ((1 - u0) / (1 - u0)) ** (-0.5) in single precision.
!
! u1, alphax and alphay are accepted but not used by this expression.
! When u0 equals 1 the quotient is 0/0.
real(4) function code(u0, u1, alphax, alphay)
    implicit none
    real(4), intent (in) :: u0
    real(4), intent (in) :: u1
    real(4), intent (in) :: alphax
    real(4), intent (in) :: alphay
    code = ((1.0e0 - u0) / (1.0e0 - u0)) ** (-0.5e0)
end function
# Evaluates ((1 - u0) / (1 - u0))^-0.5 with each step rounded through
# Float32(...). u1, alphax and alphay are accepted but not used.
# When u0 equals 1 the quotient is 0/0.
function code(u0, u1, alphax, alphay)
    one_minus_u0 = Float32(Float32(1.0) - u0)
    return Float32(one_minus_u0 / one_minus_u0) ^ Float32(-0.5)
end
function tmp = code(u0, u1, alphax, alphay)
    % Evaluates ((1 - u0) / (1 - u0)) ^ (-0.5) using single(...) constants.
    % u1, alphax and alphay are accepted but not used.
    % When u0 equals 1 the quotient is 0/0.
    one_minus_u0 = single(1.0) - u0;
    tmp = (one_minus_u0 / one_minus_u0) ^ single(-0.5);
end
{\left(\frac{1 - u0}{1 - u0}\right)}^{-0.5}
Initial program 99.4%
Applied rewrites 99.9%
Applied rewrites 99.9%
Applied rewrites 99.7%
Taylor expanded in alphax around 0
Applied rewrites 91.1%
(FPCore (u0 u1 alphax alphay)
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0))
(and (<= 2.328306437e-10 u1) (<= u1 0.5)))
(and (<= 0.0001 alphax) (<= alphax 1.0)))
(and (<= 0.0001 alphay) (<= alphay 1.0)))
(fma (/ (* (* alphax alphax) u0) 1.0) -0.5 1.0))
float code(float u0, float u1, float alphax, float alphay) {
return fmaf((((alphax * alphax) * u0) / 1.0f), -0.5f, 1.0f);
}
# Evaluates fma((alphax^2 * u0) / 1, -0.5, 1) with each arithmetic step
# rounded through Float32(...). u1 and alphay are accepted but not used.
function code(u0, u1, alphax, alphay)
    # The division by 1 is kept as written in the source expression.
    scaled = Float32(Float32(Float32(alphax * alphax) * u0) / Float32(1.0))
    return fma(scaled, Float32(-0.5), Float32(1.0))
end
\mathsf{fma}\left(\frac{\left(alphax \cdot alphax\right) \cdot u0}{1}, -0.5, 1\right)
Initial program 99.4%
Taylor expanded in alphax around 0
Applied rewrites 42.1%
Applied rewrites 33.1%
Taylor expanded in alphax around inf
Applied rewrites 87.9%
Taylor expanded in u0 around 0
Applied rewrites 88.1%
herbie shell --seed 2025359
; Input expression for the `herbie shell --seed 2025359` line above.
; Evaluated in binary32. The :pre clause bounds u0 to [2.328306437e-10, 1.0],
; u1 to [2.328306437e-10, 0.5], and alphax / alphay each to [0.0001, 1.0].
; The body computes
;   1 / sqrt(1 + ((1 / (cos(t)^2 / alphax^2 + sin(t)^2 / alphay^2)) * u0) / (1 - u0))
; with t = atan((alphay / alphax) * tan(2*PI*u1 + 0.5*PI)); the atan
; subexpression is written out in full at each of its four uses.
(FPCore (u0 u1 alphax alphay)
:name "Trowbridge-Reitz Sample, sample surface normal, cosTheta"
:precision binary32
:pre (and (and (and (and (<= 2.328306437e-10 u0) (<= u0 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 0.5))) (and (<= 0.0001 alphax) (<= alphax 1.0))) (and (<= 0.0001 alphay) (<= alphay 1.0)))
(/ 1.0 (sqrt (+ 1.0 (/ (* (/ 1.0 (+ (/ (* (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (cos (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphax alphax)) (/ (* (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI)))))) (sin (atan (* (/ alphay alphax) (tan (+ (* (* 2.0 PI) u1) (* 0.5 PI))))))) (* alphay alphay)))) u0) (- 1.0 u0))))))