
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 13 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (pow (* (* v 2.0) (exp -0.6931)) -0.5)))
(*
(* t_0 t_0)
(pow
E
(/ (fma sinTheta_O (- sinTheta_i) (fma cosTheta_i cosTheta_O -1.0)) v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = powf(((v * 2.0f) * expf(-0.6931f)), -0.5f);
return (t_0 * t_0) * powf(((float) M_E), (fmaf(sinTheta_O, -sinTheta_i, fmaf(cosTheta_i, cosTheta_O, -1.0f)) / v));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(v * Float32(2.0)) * exp(Float32(-0.6931))) ^ Float32(-0.5) return Float32(Float32(t_0 * t_0) * (Float32(exp(1)) ^ Float32(fma(sinTheta_O, Float32(-sinTheta_i), fma(cosTheta_i, cosTheta_O, Float32(-1.0))) / v))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := {\left(\left(v \cdot 2\right) \cdot e^{-0.6931}\right)}^{-0.5}\\
\left(t\_0 \cdot t\_0\right) \cdot {e}^{\left(\frac{\mathsf{fma}\left(sinTheta\_O, -sinTheta\_i, \mathsf{fma}\left(cosTheta\_i, cosTheta\_O, -1\right)\right)}{v}\right)}
\end{array}
\end{array}
Initial program 99.5%
associate-+l+N/A
+-commutativeN/A
exp-sumN/A
*-lowering-*.f32N/A
log-recN/A
unsub-negN/A
exp-diffN/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
sub-divN/A
Applied egg-rr99.5%
clear-numN/A
div-invN/A
clear-numN/A
exp-prodN/A
pow-lowering-pow.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
+-commutativeN/A
associate-+l+N/A
accelerator-lowering-fma.f32N/A
neg-lowering-neg.f32N/A
accelerator-lowering-fma.f3299.5
Applied egg-rr99.5%
clear-numN/A
inv-powN/A
sqr-powN/A
*-lowering-*.f32N/A
pow-lowering-pow.f32N/A
div-invN/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
rec-expN/A
exp-lowering-exp.f32N/A
metadata-evalN/A
metadata-evalN/A
pow-lowering-pow.f32N/A
div-invN/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
rec-expN/A
exp-lowering-exp.f32N/A
metadata-evalN/A
metadata-eval99.5
Applied egg-rr99.5%
Final simplification99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (* (/ 0.5 v) (exp 0.6931)) (pow E (/ (fma cosTheta_O cosTheta_i -1.0) v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return ((0.5f / v) * expf(0.6931f)) * powf(((float) M_E), (fmaf(cosTheta_O, cosTheta_i, -1.0f) / v));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(Float32(0.5) / v) * exp(Float32(0.6931))) * (Float32(exp(1)) ^ Float32(fma(cosTheta_O, cosTheta_i, Float32(-1.0)) / v))) end
\begin{array}{l}
\\
\left(\frac{0.5}{v} \cdot e^{0.6931}\right) \cdot {e}^{\left(\frac{\mathsf{fma}\left(cosTheta\_O, cosTheta\_i, -1\right)}{v}\right)}
\end{array}
Initial program 99.5%
associate-+l+N/A
+-commutativeN/A
exp-sumN/A
*-lowering-*.f32N/A
log-recN/A
unsub-negN/A
exp-diffN/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
sub-divN/A
Applied egg-rr99.5%
Taylor expanded in sinTheta_O around 0
sub-negN/A
metadata-evalN/A
accelerator-lowering-fma.f3299.5
Simplified99.5%
*-lft-identityN/A
exp-prodN/A
pow-lowering-pow.f32N/A
exp-1-eN/A
E-lowering-E.f32N/A
*-commutativeN/A
/-lowering-/.f32N/A
*-commutativeN/A
accelerator-lowering-fma.f3299.5
Applied egg-rr99.5%
clear-numN/A
associate-/r/N/A
*-lowering-*.f32N/A
*-commutativeN/A
associate-/r*N/A
metadata-evalN/A
/-lowering-/.f32N/A
exp-lowering-exp.f3299.5
Applied egg-rr99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ (exp 0.6931) (* v 2.0)) (pow E (/ -1.0 v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(0.6931f) / (v * 2.0f)) * powf(((float) M_E), (-1.0f / v));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(0.6931)) / Float32(v * Float32(2.0))) * (Float32(exp(1)) ^ Float32(Float32(-1.0) / v))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(single(0.6931)) / (v * single(2.0))) * (single(2.71828182845904523536) ^ (single(-1.0) / v)); end
\begin{array}{l}
\\
\frac{e^{0.6931}}{v \cdot 2} \cdot {e}^{\left(\frac{-1}{v}\right)}
\end{array}
Initial program 99.5%
associate-+l+N/A
+-commutativeN/A
exp-sumN/A
*-lowering-*.f32N/A
log-recN/A
unsub-negN/A
exp-diffN/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
sub-divN/A
Applied egg-rr99.5%
Taylor expanded in sinTheta_O around 0
sub-negN/A
metadata-evalN/A
accelerator-lowering-fma.f3299.5
Simplified99.5%
*-lft-identityN/A
exp-prodN/A
pow-lowering-pow.f32N/A
exp-1-eN/A
E-lowering-E.f32N/A
*-commutativeN/A
/-lowering-/.f32N/A
*-commutativeN/A
accelerator-lowering-fma.f3299.5
Applied egg-rr99.5%
Taylor expanded in cosTheta_O around 0
/-lowering-/.f3299.5
Simplified99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (* (exp 0.6931) (exp (/ -1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * (expf(0.6931f) * expf((-1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * (exp(0.6931e0) * exp(((-1.0e0) / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * Float32(exp(Float32(0.6931)) * exp(Float32(Float32(-1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * (exp(single(0.6931)) * exp((single(-1.0) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot \left(e^{0.6931} \cdot e^{\frac{-1}{v}}\right)
\end{array}
Initial program 99.5%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
*-lowering-*.f32N/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
sub-negN/A
+-lowering-+.f32N/A
distribute-neg-inN/A
mul-1-negN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
distribute-rgt1-inN/A
+-commutativeN/A
*-lowering-*.f32N/A
Simplified99.5%
Taylor expanded in sinTheta_O around 0
/-lowering-/.f3299.5
Simplified99.5%
+-commutativeN/A
exp-sumN/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
exp-lowering-exp.f3299.5
Applied egg-rr99.5%
Final simplification99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (/ (* cosTheta_i cosTheta_O) v)))
(if (<= (* cosTheta_i cosTheta_O) -2.9999999105145657e-35)
(exp t_0)
(if (<= (* cosTheta_i cosTheta_O) 2.000000036005019e-35)
t_0
(exp (- (* cosTheta_O (/ cosTheta_i v))))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (cosTheta_i * cosTheta_O) / v;
float tmp;
if ((cosTheta_i * cosTheta_O) <= -2.9999999105145657e-35f) {
tmp = expf(t_0);
} else if ((cosTheta_i * cosTheta_O) <= 2.000000036005019e-35f) {
tmp = t_0;
} else {
tmp = expf(-(cosTheta_O * (cosTheta_i / v)));
}
return tmp;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
real(4) :: tmp
t_0 = (costheta_i * costheta_o) / v
if ((costheta_i * costheta_o) <= (-2.9999999105145657e-35)) then
tmp = exp(t_0)
else if ((costheta_i * costheta_o) <= 2.000000036005019e-35) then
tmp = t_0
else
tmp = exp(-(costheta_o * (costheta_i / v)))
end if
code = tmp
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(cosTheta_i * cosTheta_O) / v) tmp = Float32(0.0) if (Float32(cosTheta_i * cosTheta_O) <= Float32(-2.9999999105145657e-35)) tmp = exp(t_0); elseif (Float32(cosTheta_i * cosTheta_O) <= Float32(2.000000036005019e-35)) tmp = t_0; else tmp = exp(Float32(-Float32(cosTheta_O * Float32(cosTheta_i / v)))); end return tmp end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = (cosTheta_i * cosTheta_O) / v; tmp = single(0.0); if ((cosTheta_i * cosTheta_O) <= single(-2.9999999105145657e-35)) tmp = exp(t_0); elseif ((cosTheta_i * cosTheta_O) <= single(2.000000036005019e-35)) tmp = t_0; else tmp = exp(-(cosTheta_O * (cosTheta_i / v))); end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta\_i \cdot cosTheta\_O}{v}\\
\mathbf{if}\;cosTheta\_i \cdot cosTheta\_O \leq -2.9999999105145657 \cdot 10^{-35}:\\
\;\;\;\;e^{t\_0}\\
\mathbf{elif}\;cosTheta\_i \cdot cosTheta\_O \leq 2.000000036005019 \cdot 10^{-35}:\\
\;\;\;\;t\_0\\
\mathbf{else}:\\
\;\;\;\;e^{-cosTheta\_O \cdot \frac{cosTheta\_i}{v}}\\
\end{array}
\end{array}
if (*.f32 cosTheta_i cosTheta_O) < -2.99999991e-35Initial program 99.2%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3239.3
Simplified39.3%
exp-lowering-exp.f32N/A
associate-*r/N/A
/-lowering-/.f32N/A
*-lowering-*.f3239.3
Applied egg-rr39.3%
if -2.99999991e-35 < (*.f32 cosTheta_i cosTheta_O) < 2.00000004e-35Initial program 99.7%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_O around inf
/-lowering-/.f32N/A
*-lowering-*.f3261.9
Simplified61.9%
if 2.00000004e-35 < (*.f32 cosTheta_i cosTheta_O) Initial program 99.1%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f325.7
Simplified5.7%
frac-2negN/A
div-invN/A
inv-powN/A
metadata-evalN/A
metadata-evalN/A
pow-powN/A
pow2N/A
sqr-negN/A
pow2N/A
pow-powN/A
metadata-evalN/A
metadata-evalN/A
inv-powN/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f3235.7
Applied egg-rr35.7%
*-commutativeN/A
associate-*r*N/A
*-lowering-*.f32N/A
un-div-invN/A
/-lowering-/.f32N/A
neg-lowering-neg.f3235.7
Applied egg-rr35.7%
Final simplification51.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (/ (* cosTheta_i cosTheta_O) v)))
(if (<= (* cosTheta_i cosTheta_O) -2.9999999105145657e-35)
(exp t_0)
(if (<= (* cosTheta_i cosTheta_O) 2.000000036005019e-35)
t_0
(exp (* cosTheta_i (/ cosTheta_O (- v))))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (cosTheta_i * cosTheta_O) / v;
float tmp;
if ((cosTheta_i * cosTheta_O) <= -2.9999999105145657e-35f) {
tmp = expf(t_0);
} else if ((cosTheta_i * cosTheta_O) <= 2.000000036005019e-35f) {
tmp = t_0;
} else {
tmp = expf((cosTheta_i * (cosTheta_O / -v)));
}
return tmp;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
real(4) :: tmp
t_0 = (costheta_i * costheta_o) / v
if ((costheta_i * costheta_o) <= (-2.9999999105145657e-35)) then
tmp = exp(t_0)
else if ((costheta_i * costheta_o) <= 2.000000036005019e-35) then
tmp = t_0
else
tmp = exp((costheta_i * (costheta_o / -v)))
end if
code = tmp
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(cosTheta_i * cosTheta_O) / v) tmp = Float32(0.0) if (Float32(cosTheta_i * cosTheta_O) <= Float32(-2.9999999105145657e-35)) tmp = exp(t_0); elseif (Float32(cosTheta_i * cosTheta_O) <= Float32(2.000000036005019e-35)) tmp = t_0; else tmp = exp(Float32(cosTheta_i * Float32(cosTheta_O / Float32(-v)))); end return tmp end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = (cosTheta_i * cosTheta_O) / v; tmp = single(0.0); if ((cosTheta_i * cosTheta_O) <= single(-2.9999999105145657e-35)) tmp = exp(t_0); elseif ((cosTheta_i * cosTheta_O) <= single(2.000000036005019e-35)) tmp = t_0; else tmp = exp((cosTheta_i * (cosTheta_O / -v))); end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta\_i \cdot cosTheta\_O}{v}\\
\mathbf{if}\;cosTheta\_i \cdot cosTheta\_O \leq -2.9999999105145657 \cdot 10^{-35}:\\
\;\;\;\;e^{t\_0}\\
\mathbf{elif}\;cosTheta\_i \cdot cosTheta\_O \leq 2.000000036005019 \cdot 10^{-35}:\\
\;\;\;\;t\_0\\
\mathbf{else}:\\
\;\;\;\;e^{cosTheta\_i \cdot \frac{cosTheta\_O}{-v}}\\
\end{array}
\end{array}
if (*.f32 cosTheta_i cosTheta_O) < -2.99999991e-35Initial program 99.2%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3239.3
Simplified39.3%
exp-lowering-exp.f32N/A
associate-*r/N/A
/-lowering-/.f32N/A
*-lowering-*.f3239.3
Applied egg-rr39.3%
if -2.99999991e-35 < (*.f32 cosTheta_i cosTheta_O) < 2.00000004e-35Initial program 99.7%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_O around inf
/-lowering-/.f32N/A
*-lowering-*.f3261.9
Simplified61.9%
if 2.00000004e-35 < (*.f32 cosTheta_i cosTheta_O) Initial program 99.1%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f325.7
Simplified5.7%
frac-2negN/A
neg-mul-1N/A
*-commutativeN/A
metadata-evalN/A
div-invN/A
clear-numN/A
frac-2negN/A
metadata-evalN/A
inv-powN/A
metadata-evalN/A
metadata-evalN/A
pow-powN/A
pow2N/A
sqr-negN/A
pow2N/A
pow-powN/A
metadata-evalN/A
metadata-evalN/A
inv-powN/A
clear-numN/A
/-rgt-identityN/A
/-lowering-/.f32N/A
neg-lowering-neg.f3235.7
Applied egg-rr35.7%
Final simplification51.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (+ 0.6931 (/ -1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f + (-1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp((0.6931e0 + ((-1.0e0) / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) + Float32(Float32(-1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(0.6931) + (single(-1.0) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 + \frac{-1}{v}}
\end{array}
Initial program 99.5%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
*-lowering-*.f32N/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
sub-negN/A
+-lowering-+.f32N/A
distribute-neg-inN/A
mul-1-negN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
distribute-rgt1-inN/A
+-commutativeN/A
*-lowering-*.f32N/A
Simplified99.5%
Taylor expanded in sinTheta_O around 0
/-lowering-/.f3299.5
Simplified99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (let* ((t_0 (/ (* cosTheta_i cosTheta_O) v))) (if (<= (* cosTheta_i cosTheta_O) -2.9999999105145657e-35) (exp t_0) t_0)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (cosTheta_i * cosTheta_O) / v;
float tmp;
if ((cosTheta_i * cosTheta_O) <= -2.9999999105145657e-35f) {
tmp = expf(t_0);
} else {
tmp = t_0;
}
return tmp;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
real(4) :: tmp
t_0 = (costheta_i * costheta_o) / v
if ((costheta_i * costheta_o) <= (-2.9999999105145657e-35)) then
tmp = exp(t_0)
else
tmp = t_0
end if
code = tmp
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(cosTheta_i * cosTheta_O) / v) tmp = Float32(0.0) if (Float32(cosTheta_i * cosTheta_O) <= Float32(-2.9999999105145657e-35)) tmp = exp(t_0); else tmp = t_0; end return tmp end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = (cosTheta_i * cosTheta_O) / v; tmp = single(0.0); if ((cosTheta_i * cosTheta_O) <= single(-2.9999999105145657e-35)) tmp = exp(t_0); else tmp = t_0; end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta\_i \cdot cosTheta\_O}{v}\\
\mathbf{if}\;cosTheta\_i \cdot cosTheta\_O \leq -2.9999999105145657 \cdot 10^{-35}:\\
\;\;\;\;e^{t\_0}\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if (*.f32 cosTheta_i cosTheta_O) < -2.99999991e-35Initial program 99.2%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3239.3
Simplified39.3%
exp-lowering-exp.f32N/A
associate-*r/N/A
/-lowering-/.f32N/A
*-lowering-*.f3239.3
Applied egg-rr39.3%
if -2.99999991e-35 < (*.f32 cosTheta_i cosTheta_O) Initial program 99.6%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f326.2
Simplified6.2%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_O around inf
/-lowering-/.f32N/A
*-lowering-*.f3246.9
Simplified46.9%
Final simplification45.4%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (if (<= (* cosTheta_i cosTheta_O) -2.9999999105145657e-35) (exp (* cosTheta_i (/ cosTheta_O v))) (/ (* cosTheta_i cosTheta_O) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if ((cosTheta_i * cosTheta_O) <= -2.9999999105145657e-35f) {
tmp = expf((cosTheta_i * (cosTheta_O / v)));
} else {
tmp = (cosTheta_i * cosTheta_O) / v;
}
return tmp;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: tmp
if ((costheta_i * costheta_o) <= (-2.9999999105145657e-35)) then
tmp = exp((costheta_i * (costheta_o / v)))
else
tmp = (costheta_i * costheta_o) / v
end if
code = tmp
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = Float32(0.0) if (Float32(cosTheta_i * cosTheta_O) <= Float32(-2.9999999105145657e-35)) tmp = exp(Float32(cosTheta_i * Float32(cosTheta_O / v))); else tmp = Float32(Float32(cosTheta_i * cosTheta_O) / v); end return tmp end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(0.0); if ((cosTheta_i * cosTheta_O) <= single(-2.9999999105145657e-35)) tmp = exp((cosTheta_i * (cosTheta_O / v))); else tmp = (cosTheta_i * cosTheta_O) / v; end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;cosTheta\_i \cdot cosTheta\_O \leq -2.9999999105145657 \cdot 10^{-35}:\\
\;\;\;\;e^{cosTheta\_i \cdot \frac{cosTheta\_O}{v}}\\
\mathbf{else}:\\
\;\;\;\;\frac{cosTheta\_i \cdot cosTheta\_O}{v}\\
\end{array}
\end{array}
if (*.f32 cosTheta_i cosTheta_O) < -2.99999991e-35Initial program 99.2%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3239.3
Simplified39.3%
if -2.99999991e-35 < (*.f32 cosTheta_i cosTheta_O) Initial program 99.6%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f326.2
Simplified6.2%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_O around inf
/-lowering-/.f32N/A
*-lowering-*.f3246.9
Simplified46.9%
Final simplification45.4%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (/ -1.0 v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((-1.0f / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp(((-1.0e0) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(-1.0) / v))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(-1.0) / v)); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{\frac{-1}{v}}
\end{array}
Initial program 99.5%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
*-lowering-*.f32N/A
rem-exp-logN/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
sub-negN/A
+-lowering-+.f32N/A
distribute-neg-inN/A
mul-1-negN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
distribute-rgt1-inN/A
+-commutativeN/A
*-lowering-*.f32N/A
Simplified99.5%
Taylor expanded in sinTheta_O around 0
/-lowering-/.f3299.5
Simplified99.5%
Taylor expanded in v around 0
/-lowering-/.f3296.6
Simplified96.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ (fma cosTheta_O cosTheta_i (fma sinTheta_O (- sinTheta_i) -1.0)) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((fmaf(cosTheta_O, cosTheta_i, fmaf(sinTheta_O, -sinTheta_i, -1.0f)) / v));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(fma(cosTheta_O, cosTheta_i, fma(sinTheta_O, Float32(-sinTheta_i), Float32(-1.0))) / v)) end
\begin{array}{l}
\\
e^{\frac{\mathsf{fma}\left(cosTheta\_O, cosTheta\_i, \mathsf{fma}\left(sinTheta\_O, -sinTheta\_i, -1\right)\right)}{v}}
\end{array}
Initial program 99.5%
Taylor expanded in v around 0
/-lowering-/.f32N/A
sub-negN/A
accelerator-lowering-fma.f32N/A
+-commutativeN/A
distribute-neg-inN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
metadata-evalN/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f3296.3
Simplified96.3%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* cosTheta_i cosTheta_O) v))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (cosTheta_i * cosTheta_O) / v;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (costheta_i * costheta_o) / v
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(cosTheta_i * cosTheta_O) / v) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (cosTheta_i * cosTheta_O) / v; end
\begin{array}{l}
\\
\frac{cosTheta\_i \cdot cosTheta\_O}{v}
\end{array}
Initial program 99.5%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3212.5
Simplified12.5%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f326.4
Simplified6.4%
Taylor expanded in cosTheta_O around inf
/-lowering-/.f32N/A
*-lowering-*.f3239.2
Simplified39.2%
Final simplification39.2%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 1.0)
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 1.0f;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = 1.0e0
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(1.0) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(1.0); end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.5%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
*-lowering-*.f32N/A
/-lowering-/.f3212.5
Simplified12.5%
Taylor expanded in cosTheta_i around 0
Simplified6.5%
herbie shell --seed 2024204
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))