
; Reference program: exp of the sum of an angular term, the constant 0.6931
; and log(1 / (2 v)), with every operation rounded to binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((cos_term (/ (* cosTheta_i cosTheta_O) v))
         (sin_term (/ (* sinTheta_i sinTheta_O) v))
         ; (cos_term - sin_term) - 1/v, in that association order
         (angular (- (- cos_term sin_term) (/ 1.0 v)))
         (log_norm (log (/ 1.0 (* 2.0 v)))))
    (exp (+ (+ angular 0.6931) log_norm))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Single-precision evaluation of
!>   exp(((cos_i*cos_o/v - sin_i*sin_o/v) - 1/v) + 0.6931 + log(1/(2*v)))
!> with the terms combined in the order shown.
!>
!> The expression is broken across continuation lines because, written on a
!> single line, it exceeds the 132-character free-form source line limit.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
  implicit none
  real(4), intent (in) :: costheta_i
  real(4), intent (in) :: costheta_o
  real(4), intent (in) :: sintheta_i
  real(4), intent (in) :: sintheta_o
  real(4), intent (in) :: v
  code = exp(((((((costheta_i * costheta_o) / v) &
                  - ((sintheta_i * sintheta_o) / v)) &
                 - (1.0e0 / v)) &
                + 0.6931e0) &
               + log((1.0e0 / (2.0e0 * v)))))
end function code
# Reference program: every intermediate is rounded to Float32 before the next
# operation, and the terms are accumulated in the order
# ((cos_term - sin_term) - 1/v) + 0.6931 + log(1/(2v)).
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cos_term = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_term = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    inv_v = Float32(Float32(1.0) / v)
    angular = Float32(Float32(cos_term - sin_term) - inv_v)
    log_norm = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    return exp(Float32(Float32(angular + Float32(0.6931)) + log_norm))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Reference program.
%   Returns exp(((cosTheta_i*cosTheta_O/v - sinTheta_i*sinTheta_O/v) - 1/v)
%               + 0.6931 + log(1/(2*v))), summing the terms in that order.
%   The constants are created with single().
    cos_term = (cosTheta_i * cosTheta_O) / v;
    sin_term = (sinTheta_i * sinTheta_O) / v;
    inv_v = single(1.0) / v;
    log_norm = log((single(1.0) / (single(2.0) * v)));
    tmp = exp(((((cos_term - sin_term) - inv_v) + single(0.6931)) + log_norm));
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta_i \cdot cosTheta_O}{v} - \frac{sinTheta_i \cdot sinTheta_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 9 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; First listed alternative: the same expression as the input program.
; exp(((cos_i*cos_O/v - sin_i*sin_O/v) - 1/v) + 0.6931 + log(1/(2 v))) in binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let ((angular (- (- (/ (* cosTheta_i cosTheta_O) v)
                       (/ (* sinTheta_i sinTheta_O) v))
                    (/ 1.0 v))))
    (exp (+ (+ angular 0.6931)
            (log (/ 1.0 (* 2.0 v)))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Computes exp(((cos_i*cos_o/v - sin_i*sin_o/v) - 1/v) + 0.6931 + log(1/(2*v)))
!> in single precision, combining the terms in the order shown.
!>
!> The exponent is built in two statements: the one-line form of the whole
!> expression is longer than the 132-character free-form line limit.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
  implicit none
  real(4), intent (in) :: costheta_i
  real(4), intent (in) :: costheta_o
  real(4), intent (in) :: sintheta_i
  real(4), intent (in) :: sintheta_o
  real(4), intent (in) :: v
  real(4) :: arg
  ! ((cos term - sin term) - 1/v) + 0.6931
  arg = ((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) &
         - (1.0e0 / v)) + 0.6931e0
  code = exp(arg + log(1.0e0 / (2.0e0 * v)))
end function code
# Same expression as the input program; each operation result is rounded to
# Float32 before it is used again.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    acc = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    acc = Float32(acc - Float32(Float32(sinTheta_i * sinTheta_O) / v))
    acc = Float32(acc - Float32(Float32(1.0) / v))
    acc = Float32(acc + Float32(0.6931))
    acc = Float32(acc + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))
    return exp(acc)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Same expression as the input program.
%   The exponent is accumulated term by term in the original order and then
%   passed to exp.
    acc = (cosTheta_i * cosTheta_O) / v;
    acc = acc - ((sinTheta_i * sinTheta_O) / v);
    acc = acc - (single(1.0) / v);
    acc = acc + single(0.6931);
    acc = acc + log((single(1.0) / (single(2.0) * v)));
    tmp = exp(acc);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta_i \cdot cosTheta_O}{v} - \frac{sinTheta_i \cdot sinTheta_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
; Alternative built from a cube root of a square root of the exponential.
; sinTheta_i and sinTheta_O are parameters but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((sixth_root (cbrt (sqrt (exp (/ (fma cosTheta_O cosTheta_i -1.0) v))))))
    (* (/ 0.5 v)
       (* (exp 0.6931) (pow (* sixth_root sixth_root) 3.0)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = cbrtf(sqrtf(expf((fmaf(cosTheta_O, cosTheta_i, -1.0f) / v))));
return (0.5f / v) * (expf(0.6931f) * powf((t_0 * t_0), 3.0f));
}
# Alternative form: (0.5/v) * (exp(0.6931) * (t_0*t_0)^3) with
# t_0 = cbrt(sqrt(exp(fma(cosTheta_O, cosTheta_i, -1) / v))).
# sinTheta_i and sinTheta_O are accepted but not used.
#
# The assignment and the return are placed on separate lines; written on one
# line without a separator they do not parse.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    t_0 = cbrt(sqrt(exp(Float32(fma(cosTheta_O, cosTheta_i, Float32(-1.0)) / v))))
    return Float32(Float32(Float32(0.5) / v) * Float32(exp(Float32(0.6931)) * (Float32(t_0 * t_0) ^ Float32(3.0))))
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt[3]{\sqrt{e^{\frac{\mathsf{fma}\left(cosTheta_O, cosTheta_i, -1\right)}{v}}}}\\
\frac{0.5}{v} \cdot \left(e^{0.6931} \cdot {\left(t_0 \cdot t_0\right)}^{3}\right)
\end{array}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.7%
associate-/r*99.7%
metadata-eval99.7%
+-rgt-identity99.7%
metadata-eval99.7%
metadata-eval99.7%
+-rgt-identity99.7%
sub-neg99.7%
associate-+l+99.7%
Simplified99.7%
Taylor expanded in sinTheta_i around 0 99.7%
associate--l+99.7%
associate-*r/99.7%
exp-sum99.7%
associate-*r/99.7%
sub-div99.7%
Applied egg-rr99.7%
add-cube-cbrt 99.7%
pow3 99.7%
div-inv 99.7%
div-inv 99.7%
fma-neg 99.7%
metadata-eval 99.7%
Applied egg-rr99.7%
pow1/3 99.5%
rem-cube-cbrt 99.5%
add-sqr-sqrt 99.5%
unpow-prod-down 99.5%
rem-cube-cbrt 99.5%
rem-cube-cbrt 99.5%
Applied egg-rr99.5%
unpow1/3 99.6%
unpow1/3 99.7%
Simplified99.7%
Final simplification99.7%
; Alternative that depends on v only: the four angle parameters are unused.
; (0.5 / v) * (exp(0.6931) * cbrt(exp(-1 / v))^3)
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((root (cbrt (exp (/ -1.0 v)))))
    (* (/ 0.5 v)
       (* (exp 0.6931) (pow root 3.0)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * (expf(0.6931f) * powf(cbrtf(expf((-1.0f / v))), 3.0f));
}
# Alternative that reads only v:
#   (0.5/v) * (exp(0.6931) * cbrt(exp(-1/v))^3), rounded to Float32 per step.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    half_over_v = Float32(Float32(0.5) / v)
    root = cbrt(exp(Float32(Float32(-1.0) / v)))
    scaled = Float32(exp(Float32(0.6931)) * (root ^ Float32(3.0)))
    return Float32(half_over_v * scaled)
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot \left(e^{0.6931} \cdot {\left(\sqrt[3]{e^{\frac{-1}{v}}}\right)}^{3}\right)
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.7%
associate-/r*99.7%
metadata-eval99.7%
+-rgt-identity99.7%
metadata-eval99.7%
metadata-eval99.7%
+-rgt-identity99.7%
sub-neg99.7%
associate-+l+99.7%
Simplified99.7%
Taylor expanded in sinTheta_i around 0 99.7%
associate--l+99.7%
associate-*r/99.7%
exp-sum99.7%
associate-*r/99.7%
sub-div99.7%
Applied egg-rr99.7%
add-cube-cbrt 99.7%
pow3 99.7%
div-inv 99.7%
div-inv 99.7%
fma-neg 99.7%
metadata-eval 99.7%
Applied egg-rr99.7%
Taylor expanded in cosTheta_O around 0 99.5%
unpow1/3 99.7%
Simplified99.7%
Final simplification99.7%
; Alternative that depends on v only: (0.5 / v) * (exp(0.6931) * exp(-1 / v)).
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((decay (* (exp 0.6931) (exp (/ -1.0 v)))))
    (* (/ 0.5 v) decay)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * (expf(0.6931f) * expf((-1.0f / v)));
}
!> Alternative that reads only v: (0.5/v) * (exp(0.6931) * exp(-1/v)).
!> The four angle arguments are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
  implicit none
  real(4), intent(in) :: costheta_i, costheta_o
  real(4), intent(in) :: sintheta_i, sintheta_o
  real(4), intent(in) :: v
  real(4) :: half_over_v, decay

  half_over_v = 0.5e0 / v
  decay = exp(0.6931e0) * exp((-1.0e0) / v)
  res = half_over_v * decay
end function code
# Alternative that reads only v: (0.5/v) * (exp(0.6931) * exp(-1/v)),
# with each product and quotient rounded to Float32.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    half_over_v = Float32(Float32(0.5) / v)
    decay = Float32(exp(Float32(0.6931)) * exp(Float32(Float32(-1.0) / v)))
    return Float32(half_over_v * decay)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Alternative that reads only v.
%   tmp = (0.5/v) * (exp(0.6931) * exp(-1/v)), with single() constants.
%   The four angle arguments are accepted but not used.
    half_over_v = single(0.5) / v;
    decay = exp(single(0.6931)) * exp((single(-1.0) / v));
    tmp = half_over_v * decay;
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot \left(e^{0.6931} \cdot e^{\frac{-1}{v}}\right)
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.7%
associate-/r*99.7%
metadata-eval99.7%
+-rgt-identity99.7%
metadata-eval99.7%
metadata-eval99.7%
+-rgt-identity99.7%
sub-neg99.7%
associate-+l+99.7%
Simplified99.7%
Taylor expanded in sinTheta_i around 0 99.7%
associate--l+99.7%
associate-*r/99.7%
exp-sum99.7%
associate-*r/99.7%
sub-div99.7%
Applied egg-rr99.7%
Taylor expanded in cosTheta_O around 0 99.7%
Final simplification99.7%
; Two-regime alternative selected on sinTheta_i.
; cosTheta_i and cosTheta_O are parameters but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (if (<= sinTheta_i 4.999999999099794e-24)
      ; at or below the threshold: -(sinTheta_i * sinTheta_O) / v, no exp
      (/ (* sinTheta_i (- sinTheta_O)) v)
      ; above the threshold: exp(sinTheta_O * (-sinTheta_i / v))
      (exp (* sinTheta_O (/ (- sinTheta_i) v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if (sinTheta_i <= 4.999999999099794e-24f) {
tmp = (sinTheta_i * -sinTheta_O) / v;
} else {
tmp = expf((sinTheta_O * (-sinTheta_i / v)));
}
return tmp;
}
!> Two-regime alternative selected on sintheta_i:
!>   sintheta_i <= 4.999999999099794e-24 : (sintheta_i * (-sintheta_o)) / v
!>   otherwise                           : exp(sintheta_o * (-sintheta_i / v))
!> costheta_i and costheta_o are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
  implicit none
  real(4), intent (in) :: costheta_i
  real(4), intent (in) :: costheta_o
  real(4), intent (in) :: sintheta_i
  real(4), intent (in) :: sintheta_o
  real(4), intent (in) :: v
  real(4) :: tmp
  if (sintheta_i <= 4.999999999099794e-24) then
    ! The negated operand is parenthesized: a unary minus written directly
    ! after "*" is a compiler extension, not standard Fortran.
    tmp = (sintheta_i * (-sintheta_o)) / v
  else
    tmp = exp((sintheta_o * (-sintheta_i / v)))
  end if
  code = tmp
end function code
# Two-regime alternative selected on sinTheta_i:
#   sinTheta_i <= 4.999999999099794e-24 : (sinTheta_i * -sinTheta_O) / v
#   otherwise                           : exp(sinTheta_O * (-sinTheta_i / v))
# cosTheta_i and cosTheta_O are accepted but not used.
#
# Each statement is on its own line; collapsed onto a single line without
# separators the body does not parse.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    tmp = Float32(0.0)
    if (sinTheta_i <= Float32(4.999999999099794e-24))
        tmp = Float32(Float32(sinTheta_i * Float32(-sinTheta_O)) / v)
    else
        tmp = exp(Float32(sinTheta_O * Float32(Float32(-sinTheta_i) / v)))
    end
    return tmp
end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Two-regime alternative selected on sinTheta_i.
%   sinTheta_i <= 4.999999999099794e-24 : (sinTheta_i * -sinTheta_O) / v
%   otherwise                           : exp(sinTheta_O * (-sinTheta_i / v))
%   cosTheta_i and cosTheta_O are accepted but not used.
    threshold = single(4.999999999099794e-24);
    result = single(0.0);
    if (sinTheta_i <= threshold)
        result = (sinTheta_i * -sinTheta_O) / v;
    else
        result = exp((sinTheta_O * (-sinTheta_i / v)));
    end
    tmp_2 = result;
end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;sinTheta_i \leq 4.999999999099794 \cdot 10^{-24}:\\
\;\;\;\;\frac{sinTheta_i \cdot \left(-sinTheta_O\right)}{v}\\
\mathbf{else}:\\
\;\;\;\;e^{sinTheta_O \cdot \frac{-sinTheta_i}{v}}\\
\end{array}
\end{array}
if sinTheta_i < 5e-24: Initial program 99.4%
Simplified99.4%
Taylor expanded in sinTheta_i around inf 11.2%
Taylor expanded in sinTheta_O around 0 6.4%
mul-1-neg6.4%
associate-/l*6.4%
unsub-neg6.4%
associate-/l*6.4%
associate-*r/6.4%
Simplified6.4%
Taylor expanded in sinTheta_O around inf 44.4%
if 5e-24 < sinTheta_i: Initial program 99.9%
Simplified99.9%
Taylor expanded in sinTheta_i around inf 19.1%
associate-*r/ 19.1%
neg-mul-1 19.1%
*-commutative 19.1%
distribute-rgt-neg-in 19.1%
Simplified19.1%
Final simplification36.6%
; Two-regime alternative sharing one quotient between both branches.
; cosTheta_i and cosTheta_O are parameters but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((ratio (/ (* sinTheta_i (- sinTheta_O)) v)))
    ; at or below the threshold the quotient is returned as is, otherwise exp of it
    (if (<= sinTheta_i 4.999999999099794e-24) ratio (exp ratio))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (sinTheta_i * -sinTheta_O) / v;
float tmp;
if (sinTheta_i <= 4.999999999099794e-24f) {
tmp = t_0;
} else {
tmp = expf(t_0);
}
return tmp;
}
!> Two-regime alternative built on t_0 = (sintheta_i * (-sintheta_o)) / v:
!> returns t_0 when sintheta_i <= 4.999999999099794e-24, otherwise exp(t_0).
!> costheta_i and costheta_o are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
  implicit none
  real(4), intent (in) :: costheta_i
  real(4), intent (in) :: costheta_o
  real(4), intent (in) :: sintheta_i
  real(4), intent (in) :: sintheta_o
  real(4), intent (in) :: v
  real(4) :: t_0
  real(4) :: tmp
  ! The negated operand is parenthesized: a unary minus written directly
  ! after "*" is a compiler extension, not standard Fortran.
  t_0 = (sintheta_i * (-sintheta_o)) / v
  if (sintheta_i <= 4.999999999099794e-24) then
    tmp = t_0
  else
    tmp = exp(t_0)
  end if
  code = tmp
end function code
# Two-regime alternative built on t_0 = (sinTheta_i * -sinTheta_O) / v:
# returns t_0 when sinTheta_i <= 4.999999999099794e-24, otherwise exp(t_0).
# cosTheta_i and cosTheta_O are accepted but not used.
#
# Each statement is on its own line; collapsed onto a single line without
# separators the body does not parse.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    t_0 = Float32(Float32(sinTheta_i * Float32(-sinTheta_O)) / v)
    tmp = Float32(0.0)
    if (sinTheta_i <= Float32(4.999999999099794e-24))
        tmp = t_0
    else
        tmp = exp(t_0)
    end
    return tmp
end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Two-regime alternative built on ratio = (sinTheta_i * -sinTheta_O) / v.
%   Returns ratio when sinTheta_i <= 4.999999999099794e-24, otherwise
%   exp(ratio).  cosTheta_i and cosTheta_O are accepted but not used.
    ratio = (sinTheta_i * -sinTheta_O) / v;
    result = single(0.0);
    if (sinTheta_i <= single(4.999999999099794e-24))
        result = ratio;
    else
        result = exp(ratio);
    end
    tmp_2 = result;
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{sinTheta_i \cdot \left(-sinTheta_O\right)}{v}\\
\mathbf{if}\;sinTheta_i \leq 4.999999999099794 \cdot 10^{-24}:\\
\;\;\;\;t_0\\
\mathbf{else}:\\
\;\;\;\;e^{t_0}\\
\end{array}
\end{array}
if sinTheta_i < 5e-24: Initial program 99.4%
Simplified99.4%
Taylor expanded in sinTheta_i around inf 11.2%
Taylor expanded in sinTheta_O around 0 6.4%
mul-1-neg6.4%
associate-/l*6.4%
unsub-neg6.4%
associate-/l*6.4%
associate-*r/6.4%
Simplified6.4%
Taylor expanded in sinTheta_O around inf 44.4%
if 5e-24 < sinTheta_i: Initial program 99.9%
Simplified99.9%
Taylor expanded in sinTheta_i around inf 19.1%
Final simplification36.6%
; Alternative that depends on v only: (0.5 / v) * exp(0.6931 + (-1 / v)).
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((exponent (+ 0.6931 (/ -1.0 v))))
    (* (/ 0.5 v) (exp exponent))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f + (-1.0f / v)));
}
!> Alternative that reads only v: (0.5/v) * exp(0.6931 + (-1/v)).
!> The four angle arguments are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
  implicit none
  real(4), intent(in) :: costheta_i, costheta_o
  real(4), intent(in) :: sintheta_i, sintheta_o
  real(4), intent(in) :: v
  real(4) :: arg

  arg = 0.6931e0 + ((-1.0e0) / v)
  res = (0.5e0 / v) * exp(arg)
end function code
# Alternative that reads only v: (0.5/v) * exp(0.6931 + (-1/v)),
# rounding each intermediate to Float32.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    exponent = Float32(Float32(0.6931) + Float32(Float32(-1.0) / v))
    half_over_v = Float32(Float32(0.5) / v)
    return Float32(half_over_v * exp(exponent))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Alternative that reads only v.
%   tmp = (0.5/v) * exp(0.6931 + (-1/v)), with single() constants.
%   The four angle arguments are accepted but not used.
    exponent = single(0.6931) + (single(-1.0) / v);
    tmp = (single(0.5) / v) * exp(exponent);
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 + \frac{-1}{v}}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.7%
associate-/r*99.7%
metadata-eval99.7%
+-rgt-identity99.7%
metadata-eval99.7%
metadata-eval99.7%
+-rgt-identity99.7%
sub-neg99.7%
associate-+l+99.7%
Simplified99.7%
Taylor expanded in sinTheta_i around 0 99.7%
Taylor expanded in cosTheta_O around 0 99.7%
Final simplification99.7%
; Exp-free alternative: sinTheta_O * (-sinTheta_i / v).
; cosTheta_i and cosTheta_O are parameters but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((scaled (/ (- sinTheta_i) v)))
    (* sinTheta_O scaled)))
/*
 * Exp-free alternative: sinTheta_O * (-sinTheta_i / v).
 * cosTheta_i and cosTheta_O are accepted but never read.
 */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    const float scaled = -sinTheta_i / v;
    return sinTheta_O * scaled;
}
!> Exp-free alternative: sintheta_o * (-sintheta_i / v).
!> costheta_i and costheta_o are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
  implicit none
  real(4), intent(in) :: costheta_i, costheta_o
  real(4), intent(in) :: sintheta_i, sintheta_o
  real(4), intent(in) :: v
  real(4) :: scaled

  scaled = -sintheta_i / v
  res = sintheta_o * scaled
end function code
# Exp-free alternative: sinTheta_O * (-sinTheta_i / v), rounded to Float32
# after the negation, the division and the product.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    scaled = Float32(Float32(-sinTheta_i) / v)
    return Float32(sinTheta_O * scaled)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Exp-free alternative: sinTheta_O * (-sinTheta_i / v).
%   cosTheta_i and cosTheta_O are accepted but not used.
    scaled = -sinTheta_i / v;
    tmp = sinTheta_O * scaled;
end
\begin{array}{l}
\\
sinTheta_O \cdot \frac{-sinTheta_i}{v}
\end{array}
Initial program 99.6%
Simplified99.6%
Taylor expanded in sinTheta_i around inf 13.6%
Taylor expanded in sinTheta_O around 0 6.3%
mul-1-neg6.3%
associate-/l*6.3%
unsub-neg6.3%
associate-/l*6.3%
associate-*r/6.3%
Simplified6.3%
Taylor expanded in sinTheta_O around inf 36.6%
mul-1-neg36.6%
associate-*r/19.5%
distribute-rgt-neg-in19.5%
distribute-neg-frac19.5%
Simplified19.5%
Final simplification19.5%
; Exp-free alternative: (sinTheta_i * (-sinTheta_O)) / v.
; cosTheta_i and cosTheta_O are parameters but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((neg_product (* sinTheta_i (- sinTheta_O))))
    (/ neg_product v)))
/*
 * Exp-free alternative: (sinTheta_i * -sinTheta_O) / v.
 * cosTheta_i and cosTheta_O are accepted but never read.
 */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    const float neg_product = sinTheta_i * -sinTheta_O;
    return neg_product / v;
}
!> Exp-free alternative: (sintheta_i * (-sintheta_o)) / v.
!> costheta_i and costheta_o are part of the interface but are not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
  implicit none
  real(4), intent (in) :: costheta_i
  real(4), intent (in) :: costheta_o
  real(4), intent (in) :: sintheta_i
  real(4), intent (in) :: sintheta_o
  real(4), intent (in) :: v
  ! The negated operand is parenthesized: a unary minus written directly
  ! after "*" is a compiler extension, not standard Fortran.
  code = (sintheta_i * (-sintheta_o)) / v
end function code
# Exp-free alternative: (sinTheta_i * -sinTheta_O) / v, rounded to Float32
# after the negation, the product and the division.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    neg_product = Float32(sinTheta_i * Float32(-sinTheta_O))
    return Float32(neg_product / v)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Exp-free alternative: (sinTheta_i * -sinTheta_O) / v.
%   cosTheta_i and cosTheta_O are accepted but not used.
    neg_product = sinTheta_i * -sinTheta_O;
    tmp = neg_product / v;
end
\begin{array}{l}
\\
\frac{sinTheta_i \cdot \left(-sinTheta_O\right)}{v}
\end{array}
Initial program 99.6%
Simplified99.6%
Taylor expanded in sinTheta_i around inf 13.6%
Taylor expanded in sinTheta_O around 0 6.3%
mul-1-neg6.3%
associate-/l*6.3%
unsub-neg6.3%
associate-/l*6.3%
associate-*r/6.3%
Simplified6.3%
Taylor expanded in sinTheta_O around inf 36.6%
Final simplification36.6%
; Constant alternative: the body is the literal 1.0 and reads no parameter.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  1.0)
/* Constant alternative: returns 1.0f and reads none of its arguments. */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    (void)cosTheta_i;
    (void)cosTheta_O;
    (void)sinTheta_i;
    (void)sinTheta_O;
    (void)v;
    const float result = 1.0f;
    return result;
}
!> Constant alternative: returns 1.0 and reads none of its arguments.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
  implicit none
  real(4), intent(in) :: costheta_i, costheta_o
  real(4), intent(in) :: sintheta_i, sintheta_o
  real(4), intent(in) :: v

  res = 1.0e0
end function code
# Constant alternative: returns the Float32 value 1 and reads no argument.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    return one(Float32)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
% CODE  Constant alternative: returns single(1.0) and reads no argument.
    tmp = single(1.0);
end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.6%
Simplified99.6%
Taylor expanded in sinTheta_i around inf 13.6%
Taylor expanded in sinTheta_O around 0 6.5%
Final simplification6.5%
herbie shell --seed 2024026
; Benchmark definition with name and input-range precondition.
; Every angle parameter is constrained to [-1, 1]; v to [-1.5707964, 0.1].
; Note: the body takes log(1 / (2 v)), whose argument is negative for v < 0.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :name "HairBSDF, Mp, lower"
  :precision binary32
  :pre (and (<= -1.0 cosTheta_i 1.0)
            (<= -1.0 cosTheta_O 1.0)
            (<= -1.0 sinTheta_i 1.0)
            (<= -1.0 sinTheta_O 1.0)
            (<= -1.5707964 v 0.1))
  (exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v)
                   (/ (* sinTheta_i sinTheta_O) v))
                (/ 1.0 v))
             0.6931)
          (log (/ 1.0 (* 2.0 v))))))