
(FPCore (sinTheta_O h eta)
:precision binary32
(asin
(/
h
(sqrt
(-
(* eta eta)
(/
(* sinTheta_O sinTheta_O)
(sqrt (- 1.0 (* sinTheta_O sinTheta_O)))))))))
float code(float sinTheta_O, float h, float eta) {
return asinf((h / sqrtf(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrtf((1.0f - (sinTheta_O * sinTheta_O))))))));
}
real(4) function code(sintheta_o, h, eta)
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: h
real(4), intent (in) :: eta
code = asin((h / sqrt(((eta * eta) - ((sintheta_o * sintheta_o) / sqrt((1.0e0 - (sintheta_o * sintheta_o))))))))
end function
function code(sinTheta_O, h, eta) return asin(Float32(h / sqrt(Float32(Float32(eta * eta) - Float32(Float32(sinTheta_O * sinTheta_O) / sqrt(Float32(Float32(1.0) - Float32(sinTheta_O * sinTheta_O)))))))) end
function tmp = code(sinTheta_O, h, eta) tmp = asin((h / sqrt(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrt((single(1.0) - (sinTheta_O * sinTheta_O)))))))); end
\begin{array}{l}
\\
\sin^{-1} \left(\frac{h}{\sqrt{eta \cdot eta - \frac{sinTheta\_O \cdot sinTheta\_O}{\sqrt{1 - sinTheta\_O \cdot sinTheta\_O}}}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (sinTheta_O h eta)
:precision binary32
(asin
(/
h
(sqrt
(-
(* eta eta)
(/
(* sinTheta_O sinTheta_O)
(sqrt (- 1.0 (* sinTheta_O sinTheta_O)))))))))
float code(float sinTheta_O, float h, float eta) {
return asinf((h / sqrtf(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrtf((1.0f - (sinTheta_O * sinTheta_O))))))));
}
real(4) function code(sintheta_o, h, eta)
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: h
real(4), intent (in) :: eta
code = asin((h / sqrt(((eta * eta) - ((sintheta_o * sintheta_o) / sqrt((1.0e0 - (sintheta_o * sintheta_o))))))))
end function
function code(sinTheta_O, h, eta) return asin(Float32(h / sqrt(Float32(Float32(eta * eta) - Float32(Float32(sinTheta_O * sinTheta_O) / sqrt(Float32(Float32(1.0) - Float32(sinTheta_O * sinTheta_O)))))))) end
function tmp = code(sinTheta_O, h, eta) tmp = asin((h / sqrt(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrt((single(1.0) - (sinTheta_O * sinTheta_O)))))))); end
\begin{array}{l}
\\
\sin^{-1} \left(\frac{h}{\sqrt{eta \cdot eta - \frac{sinTheta\_O \cdot sinTheta\_O}{\sqrt{1 - sinTheta\_O \cdot sinTheta\_O}}}}\right)
\end{array}
sinTheta_O_m = (fabs.f32 sinTheta_O) (FPCore (sinTheta_O_m h eta) :precision binary32 (if (<= sinTheta_O_m 4.22000007260429e-25) (asin (/ h eta)) (asin (/ h (sqrt (* (- eta sinTheta_O_m) (+ eta sinTheta_O_m)))))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
float tmp;
if (sinTheta_O_m <= 4.22000007260429e-25f) {
tmp = asinf((h / eta));
} else {
tmp = asinf((h / sqrtf(((eta - sinTheta_O_m) * (eta + sinTheta_O_m)))));
}
return tmp;
}
sinTheta_O_m = abs(sintheta_o)
real(4) function code(sintheta_o_m, h, eta)
real(4), intent (in) :: sintheta_o_m
real(4), intent (in) :: h
real(4), intent (in) :: eta
real(4) :: tmp
if (sintheta_o_m <= 4.22000007260429e-25) then
tmp = asin((h / eta))
else
tmp = asin((h / sqrt(((eta - sintheta_o_m) * (eta + sintheta_o_m)))))
end if
code = tmp
end function
sinTheta_O_m = abs(sinTheta_O) function code(sinTheta_O_m, h, eta) tmp = Float32(0.0) if (sinTheta_O_m <= Float32(4.22000007260429e-25)) tmp = asin(Float32(h / eta)); else tmp = asin(Float32(h / sqrt(Float32(Float32(eta - sinTheta_O_m) * Float32(eta + sinTheta_O_m))))); end return tmp end
sinTheta_O_m = abs(sinTheta_O); function tmp_2 = code(sinTheta_O_m, h, eta) tmp = single(0.0); if (sinTheta_O_m <= single(4.22000007260429e-25)) tmp = asin((h / eta)); else tmp = asin((h / sqrt(((eta - sinTheta_O_m) * (eta + sinTheta_O_m))))); end tmp_2 = tmp; end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\begin{array}{l}
\mathbf{if}\;sinTheta\_O\_m \leq 4.22000007260429 \cdot 10^{-25}:\\
\;\;\;\;\sin^{-1} \left(\frac{h}{eta}\right)\\
\mathbf{else}:\\
\;\;\;\;\sin^{-1} \left(\frac{h}{\sqrt{\left(eta - sinTheta\_O\_m\right) \cdot \left(eta + sinTheta\_O\_m\right)}}\right)\\
\end{array}
\end{array}
if sinTheta_O < 4.22000007e-25Initial program 91.1%
Taylor expanded in eta around inf
lower-/.f3294.4
Simplified94.4%
if 4.22000007e-25 < sinTheta_O Initial program 98.5%
Taylor expanded in sinTheta_O around 0
+-commutativeN/A
mul-1-negN/A
unsub-negN/A
unpow2N/A
unpow2N/A
difference-of-squaresN/A
lower-*.f32N/A
lower-+.f32N/A
lower--.f3297.0
Simplified97.0%
Final simplification95.0%
sinTheta_O_m = (fabs.f32 sinTheta_O) (FPCore (sinTheta_O_m h eta) :precision binary32 (asin (/ h (* (sqrt (- eta sinTheta_O_m)) (sqrt (+ eta sinTheta_O_m))))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / (sqrtf((eta - sinTheta_O_m)) * sqrtf((eta + sinTheta_O_m)))));
}
sinTheta_O_m = abs(sintheta_o)
real(4) function code(sintheta_o_m, h, eta)
real(4), intent (in) :: sintheta_o_m
real(4), intent (in) :: h
real(4), intent (in) :: eta
code = asin((h / (sqrt((eta - sintheta_o_m)) * sqrt((eta + sintheta_o_m)))))
end function
sinTheta_O_m = abs(sinTheta_O) function code(sinTheta_O_m, h, eta) return asin(Float32(h / Float32(sqrt(Float32(eta - sinTheta_O_m)) * sqrt(Float32(eta + sinTheta_O_m))))) end
sinTheta_O_m = abs(sinTheta_O); function tmp = code(sinTheta_O_m, h, eta) tmp = asin((h / (sqrt((eta - sinTheta_O_m)) * sqrt((eta + sinTheta_O_m))))); end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{\sqrt{eta - sinTheta\_O\_m} \cdot \sqrt{eta + sinTheta\_O\_m}}\right)
\end{array}
Initial program 92.9%
Taylor expanded in sinTheta_O around 0
+-commutativeN/A
mul-1-negN/A
unsub-negN/A
unpow2N/A
unpow2N/A
difference-of-squaresN/A
lower-*.f32N/A
lower-+.f32N/A
lower--.f3292.4
Simplified92.4%
lift-+.f32N/A
lift--.f32N/A
sqrt-prodN/A
pow1/2N/A
pow1/2N/A
*-commutativeN/A
lower-*.f32N/A
pow1/2N/A
lower-sqrt.f32N/A
pow1/2N/A
lower-sqrt.f3297.9
lift-+.f32N/A
+-commutativeN/A
lower-+.f3297.9
Applied egg-rr97.9%
Final simplification97.9%
sinTheta_O_m = (fabs.f32 sinTheta_O) (FPCore (sinTheta_O_m h eta) :precision binary32 (asin (/ h (fma (* sinTheta_O_m (/ -0.5 eta)) sinTheta_O_m eta))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / fmaf((sinTheta_O_m * (-0.5f / eta)), sinTheta_O_m, eta)));
}
sinTheta_O_m = abs(sinTheta_O) function code(sinTheta_O_m, h, eta) return asin(Float32(h / fma(Float32(sinTheta_O_m * Float32(Float32(-0.5) / eta)), sinTheta_O_m, eta))) end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{\mathsf{fma}\left(sinTheta\_O\_m \cdot \frac{-0.5}{eta}, sinTheta\_O\_m, eta\right)}\right)
\end{array}
Initial program 92.9%
Taylor expanded in sinTheta_O around 0
+-commutativeN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
associate-*r/N/A
lower-fma.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f3295.4
Simplified95.4%
lift-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-*l*N/A
*-commutativeN/A
lower-fma.f32N/A
lower-*.f3296.3
Applied egg-rr96.3%
sinTheta_O_m = (fabs.f32 sinTheta_O) (FPCore (sinTheta_O_m h eta) :precision binary32 (asin (/ h (fma (* sinTheta_O_m sinTheta_O_m) (/ -0.5 eta) eta))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / fmaf((sinTheta_O_m * sinTheta_O_m), (-0.5f / eta), eta)));
}
sinTheta_O_m = abs(sinTheta_O) function code(sinTheta_O_m, h, eta) return asin(Float32(h / fma(Float32(sinTheta_O_m * sinTheta_O_m), Float32(Float32(-0.5) / eta), eta))) end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{\mathsf{fma}\left(sinTheta\_O\_m \cdot sinTheta\_O\_m, \frac{-0.5}{eta}, eta\right)}\right)
\end{array}
Initial program 92.9%
Taylor expanded in sinTheta_O around 0
+-commutativeN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
associate-*r/N/A
lower-fma.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f3295.4
Simplified95.4%
sinTheta_O_m = (fabs.f32 sinTheta_O) (FPCore (sinTheta_O_m h eta) :precision binary32 (asin (/ h eta)))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / eta));
}
sinTheta_O_m = abs(sintheta_o)
real(4) function code(sintheta_o_m, h, eta)
real(4), intent (in) :: sintheta_o_m
real(4), intent (in) :: h
real(4), intent (in) :: eta
code = asin((h / eta))
end function
sinTheta_O_m = abs(sinTheta_O) function code(sinTheta_O_m, h, eta) return asin(Float32(h / eta)) end
sinTheta_O_m = abs(sinTheta_O); function tmp = code(sinTheta_O_m, h, eta) tmp = asin((h / eta)); end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{eta}\right)
\end{array}
Initial program 92.9%
Taylor expanded in eta around inf
lower-/.f3292.5
Simplified92.5%
herbie shell --seed 2024208
(FPCore (sinTheta_O h eta)
:name "HairBSDF, gamma for a refracted ray"
:precision binary32
:pre (and (and (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0)) (and (<= -1.0 h) (<= h 1.0))) (and (<= 0.0 eta) (<= eta 10.0)))
(asin (/ h (sqrt (- (* eta eta) (/ (* sinTheta_O sinTheta_O) (sqrt (- 1.0 (* sinTheta_O sinTheta_O)))))))))