
; Initial program: asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with
; s = sinTheta_O, evaluated in binary32.
(FPCore (sinTheta_O h eta)
  :precision binary32
  (let* ((sin_sq (* sinTheta_O sinTheta_O))            ; s^2, used twice below
         (root (sqrt (- 1.0 sin_sq)))                  ; sqrt(1 - s^2)
         (denom_sq (- (* eta eta) (/ sin_sq root))))   ; radicand of the outer sqrt
    (asin (/ h (sqrt denom_sq)))))
float code(float sinTheta_O, float h, float eta) {
return asinf((h / sqrtf(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrtf((1.0f - (sinTheta_O * sinTheta_O))))))));
}
!> Returns asin(h / sqrt(eta**2 - s**2 / sqrt(1 - s**2))) with s = sintheta_o.
!> All operands and the result are real(4); the operations run in the same
!> order as in the single-expression form.
real(4) function code(sintheta_o, h, eta) result(res)
    implicit none
    real(4), intent (in) :: sintheta_o, h, eta
    real(4) :: sin_sq, denom_sq
    sin_sq = sintheta_o * sintheta_o
    denom_sq = (eta * eta) - (sin_sq / sqrt(1.0e0 - sin_sq))
    res = asin(h / sqrt(denom_sq))
end function code
# Returns asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with s = sinTheta_O.
# Each intermediate is rounded to Float32 exactly where the one-line form
# wrapped it in Float32(...).
function code(sinTheta_O, h, eta)
    sin_sq = Float32(sinTheta_O * sinTheta_O)
    root = sqrt(Float32(Float32(1.0) - sin_sq))
    denom_sq = Float32(Float32(eta * eta) - Float32(sin_sq / root))
    return asin(Float32(h / sqrt(denom_sq)))
end
function tmp = code(sinTheta_O, h, eta)
    % Returns asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with s = sinTheta_O.
    % The constant 1 is a single, matching the one-line form.
    sinSq = sinTheta_O * sinTheta_O;
    denomSq = (eta * eta) - (sinSq / sqrt(single(1.0) - sinSq));
    tmp = asin(h / sqrt(denomSq));
end
\begin{array}{l}
\\
\sin^{-1} \left(\frac{h}{\sqrt{eta \cdot eta - \frac{sinTheta\_O \cdot sinTheta\_O}{\sqrt{1 - sinTheta\_O \cdot sinTheta\_O}}}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Initial program: asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with
; s = sinTheta_O, evaluated in binary32.
(FPCore (sinTheta_O h eta)
  :precision binary32
  (let* ((sin_sq (* sinTheta_O sinTheta_O))            ; s^2, used twice below
         (root (sqrt (- 1.0 sin_sq)))                  ; sqrt(1 - s^2)
         (denom_sq (- (* eta eta) (/ sin_sq root))))   ; radicand of the outer sqrt
    (asin (/ h (sqrt denom_sq)))))
float code(float sinTheta_O, float h, float eta) {
return asinf((h / sqrtf(((eta * eta) - ((sinTheta_O * sinTheta_O) / sqrtf((1.0f - (sinTheta_O * sinTheta_O))))))));
}
!> Returns asin(h / sqrt(eta**2 - s**2 / sqrt(1 - s**2))) with s = sintheta_o.
!> All operands and the result are real(4); the operations run in the same
!> order as in the single-expression form.
real(4) function code(sintheta_o, h, eta) result(res)
    implicit none
    real(4), intent (in) :: sintheta_o, h, eta
    real(4) :: sin_sq, denom_sq
    sin_sq = sintheta_o * sintheta_o
    denom_sq = (eta * eta) - (sin_sq / sqrt(1.0e0 - sin_sq))
    res = asin(h / sqrt(denom_sq))
end function code
# Returns asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with s = sinTheta_O.
# Each intermediate is rounded to Float32 exactly where the one-line form
# wrapped it in Float32(...).
function code(sinTheta_O, h, eta)
    sin_sq = Float32(sinTheta_O * sinTheta_O)
    root = sqrt(Float32(Float32(1.0) - sin_sq))
    denom_sq = Float32(Float32(eta * eta) - Float32(sin_sq / root))
    return asin(Float32(h / sqrt(denom_sq)))
end
function tmp = code(sinTheta_O, h, eta)
    % Returns asin(h / sqrt(eta^2 - s^2 / sqrt(1 - s^2))) with s = sinTheta_O.
    % The constant 1 is a single, matching the one-line form.
    sinSq = sinTheta_O * sinTheta_O;
    denomSq = (eta * eta) - (sinSq / sqrt(single(1.0) - sinSq));
    tmp = asin(h / sqrt(denomSq));
end
\begin{array}{l}
\\
\sin^{-1} \left(\frac{h}{\sqrt{eta \cdot eta - \frac{sinTheta\_O \cdot sinTheta\_O}{\sqrt{1 - sinTheta\_O \cdot sinTheta\_O}}}}\right)
\end{array}
sinTheta_O_m = (fabs.f32 sinTheta_O)
; Alternative 1. t_0 = (1 - s^2)^(-1/4) with s = sinTheta_O_m, so (s * t_0)^2
; equals s^2 / sqrt(1 - s^2). The radicand eta^2 - (s * t_0)^2 is written as
; the product (eta + s * t_0) * (eta - s * t_0), and the square root is taken
; of each factor separately.
(FPCore (sinTheta_O_m h eta)
  :precision binary32
  (let* ((t_0 (pow (- 1.0 (pow sinTheta_O_m 2.0)) -0.25)))
    (asin
      (/ h
         (* (sqrt (fma sinTheta_O_m t_0 eta))
            (sqrt (- eta (* sinTheta_O_m t_0))))))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
float t_0 = powf((1.0f - powf(sinTheta_O_m, 2.0f)), -0.25f);
return asinf((h / (sqrtf(fmaf(sinTheta_O_m, t_0, eta)) * sqrtf((eta - (sinTheta_O_m * t_0))))));
}
# Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O)
#
# Alternative 1: asin(h / (sqrt(eta + s * t_0) * sqrt(eta - s * t_0)))
# with s = sinTheta_O_m and t_0 = (1 - s^2)^(-1/4). Intermediates are rounded
# to Float32 at the same points as in the generated one-line form.
function code(sinTheta_O_m, h, eta)
    t_0 = Float32(Float32(1.0) - (sinTheta_O_m ^ Float32(2.0))) ^ Float32(-0.25)
    sum_root = sqrt(fma(sinTheta_O_m, t_0, eta))
    diff_root = sqrt(Float32(eta - Float32(sinTheta_O_m * t_0)))
    return asin(Float32(h / Float32(sum_root * diff_root)))
end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\begin{array}{l}
t_0 := {\left(1 - {sinTheta\_O\_m}^{2}\right)}^{-0.25}\\
\sin^{-1} \left(\frac{h}{\sqrt{\mathsf{fma}\left(sinTheta\_O\_m, t\_0, eta\right)} \cdot \sqrt{eta - sinTheta\_O\_m \cdot t\_0}}\right)
\end{array}
\end{array}
Initial program 93.5%
add-sqr-sqrt 93.5%
difference-of-squares 93.5%
sqrt-div 93.5%
sqrt-prod 43.8%
add-sqr-sqrt 89.6%
pow1/2 89.6%
sqrt-pow1 89.6%
pow2 89.6%
metadata-eval 89.6%
sqrt-div 89.6%
sqrt-prod 44.0%
add-sqr-sqrt 93.6%
pow1/2 93.6%
sqrt-pow1 93.6%
Applied egg-rr 93.6%
sqrt-prod 98.5%
+-commutative 98.5%
div-inv 98.5%
fma-define 98.5%
pow-flip 98.5%
metadata-eval 98.5%
div-inv 98.5%
pow-flip 98.5%
metadata-eval 98.5%
Applied egg-rr 98.5%
sinTheta_O_m = (fabs.f32 sinTheta_O)
; Alternative 2: asin((h / eta) / (1 - 0.5 * (sinTheta_O_m / eta)^2)),
; with the denominator computed by one fma, in binary32.
(FPCore (sinTheta_O_m h eta)
  :precision binary32
  (asin (/ (/ h eta) (fma -0.5 (pow (/ sinTheta_O_m eta) 2.0) 1.0))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf(((h / eta) / fmaf(-0.5f, powf((sinTheta_O_m / eta), 2.0f), 1.0f)));
}
# Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O)
#
# Alternative 2: asin((h / eta) / (1 - 0.5 * (sinTheta_O_m / eta)^2)),
# with the denominator computed by one fma and Float32 rounding at the same
# points as in the generated one-line form.
function code(sinTheta_O_m, h, eta)
    ratio_sq = Float32(sinTheta_O_m / eta) ^ Float32(2.0)
    factor = fma(Float32(-0.5), ratio_sq, Float32(1.0))
    return asin(Float32(Float32(h / eta) / factor))
end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{\frac{h}{eta}}{\mathsf{fma}\left(-0.5, {\left(\frac{sinTheta\_O\_m}{eta}\right)}^{2}, 1\right)}\right)
\end{array}
Initial program 93.5%
Taylor expanded in eta around inf 92.9%
Taylor expanded in sinTheta_O around 0 92.8%
*-un-lft-identity 92.8%
associate-/r* 92.8%
+-commutative 92.8%
fma-define 92.8%
add-sqr-sqrt 92.8%
pow2 92.8%
sqrt-div 92.8%
sqrt-pow1 93.3%
metadata-eval 93.3%
pow1 93.3%
sqrt-pow1 97.7%
metadata-eval 97.7%
pow1 97.7%
Applied egg-rr 97.7%
*-lft-identity 97.7%
Simplified 97.7%
sinTheta_O_m = (fabs.f32 sinTheta_O)
; Alternative 3: asin(h / (eta * (1 + -0.5 * (sinTheta_O_m / eta)^2))),
; evaluated in binary32.
(FPCore (sinTheta_O_m h eta)
  :precision binary32
  (asin (/ h (* eta (+ 1.0 (* -0.5 (pow (/ sinTheta_O_m eta) 2.0)))))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / (eta * (1.0f + (-0.5f * powf((sinTheta_O_m / eta), 2.0f))))));
}
sinTheta_O_m = abs(sintheta_o)
!> Alternative 3: asin(h / (eta * (1 + -0.5 * (sintheta_o_m / eta)**2))).
!> All operands and the result are real(4); the exponent stays the real
!> literal 2.0e0, as in the single-expression form.
real(4) function code(sintheta_o_m, h, eta) result(res)
    implicit none
    real(4), intent (in) :: sintheta_o_m, h, eta
    real(4) :: ratio, factor
    ratio = sintheta_o_m / eta
    factor = 1.0e0 + ((-0.5e0) * (ratio ** 2.0e0))
    res = asin(h / (eta * factor))
end function code
# Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O)
#
# Alternative 3: asin(h / (eta * (1 + -0.5 * (sinTheta_O_m / eta)^2))),
# with Float32 rounding at the same points as in the generated one-line form.
function code(sinTheta_O_m, h, eta)
    ratio_sq = Float32(sinTheta_O_m / eta) ^ Float32(2.0)
    factor = Float32(Float32(1.0) + Float32(Float32(-0.5) * ratio_sq))
    return asin(Float32(h / Float32(eta * factor)))
end
% Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O);
function tmp = code(sinTheta_O_m, h, eta)
    % Alternative 3: asin(h / (eta * (1 + -0.5 * (sinTheta_O_m / eta)^2))).
    % Constants are singles, as in the generated one-line form.
    ratio = sinTheta_O_m / eta;
    factor = single(1.0) + (single(-0.5) * (ratio ^ single(2.0)));
    tmp = asin(h / (eta * factor));
end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{eta \cdot \left(1 + -0.5 \cdot {\left(\frac{sinTheta\_O\_m}{eta}\right)}^{2}\right)}\right)
\end{array}
Initial program 93.5%
Taylor expanded in eta around inf 92.9%
Taylor expanded in sinTheta_O around 0 92.8%
associate-*r/ 92.8%
Applied egg-rr 92.8%
associate-/l* 92.8%
unpow2 92.8%
unpow2 92.8%
times-frac 97.7%
unpow2 97.7%
Simplified 97.7%
sinTheta_O_m = (fabs.f32 sinTheta_O)
; Alternative 4: asin(h / (eta + -0.5 * (sinTheta_O_m^2 / eta))),
; evaluated in binary32.
(FPCore (sinTheta_O_m h eta)
  :precision binary32
  (asin (/ h (+ eta (* -0.5 (/ (pow sinTheta_O_m 2.0) eta))))))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / (eta + (-0.5f * (powf(sinTheta_O_m, 2.0f) / eta)))));
}
sinTheta_O_m = abs(sintheta_o)
!> Alternative 4: asin(h / (eta + -0.5 * (sintheta_o_m**2 / eta))).
!> All operands and the result are real(4); the exponent stays the real
!> literal 2.0e0, as in the single-expression form.
real(4) function code(sintheta_o_m, h, eta) result(res)
    implicit none
    real(4), intent (in) :: sintheta_o_m, h, eta
    real(4) :: correction
    correction = (-0.5e0) * ((sintheta_o_m ** 2.0e0) / eta)
    res = asin(h / (eta + correction))
end function code
# Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O)
#
# Alternative 4: asin(h / (eta + -0.5 * (sinTheta_O_m^2 / eta))),
# with Float32 rounding at the same points as in the generated one-line form.
function code(sinTheta_O_m, h, eta)
    correction = Float32(Float32(-0.5) * Float32((sinTheta_O_m ^ Float32(2.0)) / eta))
    return asin(Float32(h / Float32(eta + correction)))
end
% Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O);
function tmp = code(sinTheta_O_m, h, eta)
    % Alternative 4: asin(h / (eta + -0.5 * (sinTheta_O_m^2 / eta))).
    % Constants are singles, as in the generated one-line form.
    correction = single(-0.5) * ((sinTheta_O_m ^ single(2.0)) / eta);
    tmp = asin(h / (eta + correction));
end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{eta + -0.5 \cdot \frac{{sinTheta\_O\_m}^{2}}{eta}}\right)
\end{array}
Initial program 93.5%
Taylor expanded in sinTheta_O around 0 97.2%
sinTheta_O_m = (fabs.f32 sinTheta_O)
; Alternative 5: asin(h / eta) in binary32. sinTheta_O_m is still a
; parameter but does not appear in the body.
(FPCore (sinTheta_O_m h eta)
  :precision binary32
  (asin (/ h eta)))
sinTheta_O_m = fabs(sinTheta_O);
float code(float sinTheta_O_m, float h, float eta) {
return asinf((h / eta));
}
sinTheta_O_m = abs(sintheta_o)
!> Alternative 5: asin(h / eta) in real(4).
!> sintheta_o_m is part of the interface but is not used in the computation.
real(4) function code(sintheta_o_m, h, eta) result(res)
    implicit none
    real(4), intent (in) :: sintheta_o_m, h, eta
    real(4) :: ratio
    ratio = h / eta
    res = asin(ratio)
end function code
# Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O)
#
# Alternative 5: asin(h / eta), with the quotient rounded to Float32.
# sinTheta_O_m is accepted but not used in the computation.
function code(sinTheta_O_m, h, eta)
    ratio = Float32(h / eta)
    return asin(ratio)
end
% Precondition (Herbie preprocessing): sinTheta_O_m = abs(sinTheta_O);
function tmp = code(sinTheta_O_m, h, eta)
    % Alternative 5: asin(h / eta).
    % sinTheta_O_m is accepted but not used in the computation.
    ratio = h / eta;
    tmp = asin(ratio);
end
\begin{array}{l}
sinTheta_O_m = \left|sinTheta\_O\right|
\\
\sin^{-1} \left(\frac{h}{eta}\right)
\end{array}
Initial program 93.5%
Taylor expanded in eta around inf 95.1%
herbie shell --seed 2024090
; Benchmark input: the initial program together with its name and the
; precondition on its inputs.
(FPCore (sinTheta_O h eta)
:name "HairBSDF, gamma for a refracted ray"
:precision binary32
; Precondition: -1 <= sinTheta_O <= 1, -1 <= h <= 1, 0 <= eta <= 10.
:pre (and (and (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0)) (and (<= -1.0 h) (<= h 1.0))) (and (<= 0.0 eta) (<= eta 10.0)))
; asin(h / sqrt(eta^2 - sinTheta_O^2 / sqrt(1 - sinTheta_O^2)))
(asin (/ h (sqrt (- (* eta eta) (/ (* sinTheta_O sinTheta_O) (sqrt (- 1.0 (* sinTheta_O sinTheta_O)))))))))