
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 9 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (exp (+ (/ (- -1.0 (* sinTheta_O sinTheta_i)) v) 0.6931)) (* v 2.0)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((((-1.0f - (sinTheta_O * sinTheta_i)) / v) + 0.6931f)) / (v * 2.0f);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((-1.0e0) - (sintheta_o * sintheta_i)) / v) + 0.6931e0)) / (v * 2.0e0)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(exp(Float32(Float32(Float32(Float32(-1.0) - Float32(sinTheta_O * sinTheta_i)) / v) + Float32(0.6931))) / Float32(v * Float32(2.0))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((((single(-1.0) - (sinTheta_O * sinTheta_i)) / v) + single(0.6931))) / (v * single(2.0)); end
\begin{array}{l}
\\
\frac{e^{\frac{-1 - sinTheta\_O \cdot sinTheta\_i}{v} + 0.6931}}{v \cdot 2}
\end{array}
Initial program 99.6%
Applied rewrites99.2%
Taylor expanded in cosTheta_i around 0
mul-1-negN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f3299.6
Applied rewrites99.6%
lift-neg.f32N/A
lift-*.f32N/A
+-commutativeN/A
lift-*.f32N/A
lift-neg.f32N/A
distribute-rgt-neg-outN/A
unsub-negN/A
lower--.f32N/A
lower-*.f3299.6
Applied rewrites99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(if (<=
(+
(+
0.6931
(+
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_O sinTheta_i) v))
(/ -1.0 v)))
(log (/ 1.0 (* v 2.0))))
-3.999999911278523e+22)
(*
(* cosTheta_O cosTheta_O)
(fma
0.5
(/ (* cosTheta_i cosTheta_i) (* v v))
(/ cosTheta_i (* v cosTheta_O))))
(/
(* cosTheta_i (* cosTheta_i (* 0.5 (* cosTheta_O cosTheta_O))))
(* v v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if (((0.6931f + ((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_O * sinTheta_i) / v)) + (-1.0f / v))) + logf((1.0f / (v * 2.0f)))) <= -3.999999911278523e+22f) {
tmp = (cosTheta_O * cosTheta_O) * fmaf(0.5f, ((cosTheta_i * cosTheta_i) / (v * v)), (cosTheta_i / (v * cosTheta_O)));
} else {
tmp = (cosTheta_i * (cosTheta_i * (0.5f * (cosTheta_O * cosTheta_O)))) / (v * v);
}
return tmp;
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = Float32(0.0) if (Float32(Float32(Float32(0.6931) + Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_O * sinTheta_i) / v)) + Float32(Float32(-1.0) / v))) + log(Float32(Float32(1.0) / Float32(v * Float32(2.0))))) <= Float32(-3.999999911278523e+22)) tmp = Float32(Float32(cosTheta_O * cosTheta_O) * fma(Float32(0.5), Float32(Float32(cosTheta_i * cosTheta_i) / Float32(v * v)), Float32(cosTheta_i / Float32(v * cosTheta_O)))); else tmp = Float32(Float32(cosTheta_i * Float32(cosTheta_i * Float32(Float32(0.5) * Float32(cosTheta_O * cosTheta_O)))) / Float32(v * v)); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\left(0.6931 + \left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_O \cdot sinTheta\_i}{v}\right) + \frac{-1}{v}\right)\right) + \log \left(\frac{1}{v \cdot 2}\right) \leq -3.999999911278523 \cdot 10^{+22}:\\
\;\;\;\;\left(cosTheta\_O \cdot cosTheta\_O\right) \cdot \mathsf{fma}\left(0.5, \frac{cosTheta\_i \cdot cosTheta\_i}{v \cdot v}, \frac{cosTheta\_i}{v \cdot cosTheta\_O}\right)\\
\mathbf{else}:\\
\;\;\;\;\frac{cosTheta\_i \cdot \left(cosTheta\_i \cdot \left(0.5 \cdot \left(cosTheta\_O \cdot cosTheta\_O\right)\right)\right)}{v \cdot v}\\
\end{array}
\end{array}
if (+.f32 (+.f32 (-.f32 (-.f32 (/.f32 (*.f32 cosTheta_i cosTheta_O) v) (/.f32 (*.f32 sinTheta_i sinTheta_O) v)) (/.f32 #s(literal 1 binary32) v)) #s(literal 6931/10000 binary32)) (log.f32 (/.f32 #s(literal 1 binary32) (*.f32 #s(literal 2 binary32) v)))) < -3.99999991e22Initial program 100.0%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3220.0
Applied rewrites20.0%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f327.2
Applied rewrites7.2%
Taylor expanded in cosTheta_O around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-/.f32N/A
*-commutativeN/A
lower-*.f3253.3
Applied rewrites4.2%
if -3.99999991e22 < (+.f32 (+.f32 (-.f32 (-.f32 (/.f32 (*.f32 cosTheta_i cosTheta_O) v) (/.f32 (*.f32 sinTheta_i sinTheta_O) v)) (/.f32 #s(literal 1 binary32) v)) #s(literal 6931/10000 binary32)) (log.f32 (/.f32 #s(literal 1 binary32) (*.f32 #s(literal 2 binary32) v)))) Initial program 99.3%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f328.9
Applied rewrites8.9%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f327.2
Applied rewrites7.2%
Taylor expanded in cosTheta_O around inf
associate-*r/N/A
lower-/.f32N/A
associate-*r*N/A
unpow2N/A
associate-*r*N/A
associate-*r*N/A
lower-*.f32N/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f3280.0
Applied rewrites80.0%
Final simplification74.1%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (/ (* cosTheta_i cosTheta_O) v)))
(if (<=
(+
(+ 0.6931 (+ (- t_0 (/ (* sinTheta_O sinTheta_i) v)) (/ -1.0 v)))
(log (/ 1.0 (* v 2.0))))
-3.999999911278523e+22)
t_0
(/
(* cosTheta_i (* cosTheta_i (* 0.5 (* cosTheta_O cosTheta_O))))
(* v v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (cosTheta_i * cosTheta_O) / v;
float tmp;
if (((0.6931f + ((t_0 - ((sinTheta_O * sinTheta_i) / v)) + (-1.0f / v))) + logf((1.0f / (v * 2.0f)))) <= -3.999999911278523e+22f) {
tmp = t_0;
} else {
tmp = (cosTheta_i * (cosTheta_i * (0.5f * (cosTheta_O * cosTheta_O)))) / (v * v);
}
return tmp;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
real(4) :: tmp
t_0 = (costheta_i * costheta_o) / v
if (((0.6931e0 + ((t_0 - ((sintheta_o * sintheta_i) / v)) + ((-1.0e0) / v))) + log((1.0e0 / (v * 2.0e0)))) <= (-3.999999911278523e+22)) then
tmp = t_0
else
tmp = (costheta_i * (costheta_i * (0.5e0 * (costheta_o * costheta_o)))) / (v * v)
end if
code = tmp
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(cosTheta_i * cosTheta_O) / v) tmp = Float32(0.0) if (Float32(Float32(Float32(0.6931) + Float32(Float32(t_0 - Float32(Float32(sinTheta_O * sinTheta_i) / v)) + Float32(Float32(-1.0) / v))) + log(Float32(Float32(1.0) / Float32(v * Float32(2.0))))) <= Float32(-3.999999911278523e+22)) tmp = t_0; else tmp = Float32(Float32(cosTheta_i * Float32(cosTheta_i * Float32(Float32(0.5) * Float32(cosTheta_O * cosTheta_O)))) / Float32(v * v)); end return tmp end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = (cosTheta_i * cosTheta_O) / v; tmp = single(0.0); if (((single(0.6931) + ((t_0 - ((sinTheta_O * sinTheta_i) / v)) + (single(-1.0) / v))) + log((single(1.0) / (v * single(2.0))))) <= single(-3.999999911278523e+22)) tmp = t_0; else tmp = (cosTheta_i * (cosTheta_i * (single(0.5) * (cosTheta_O * cosTheta_O)))) / (v * v); end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta\_i \cdot cosTheta\_O}{v}\\
\mathbf{if}\;\left(0.6931 + \left(\left(t\_0 - \frac{sinTheta\_O \cdot sinTheta\_i}{v}\right) + \frac{-1}{v}\right)\right) + \log \left(\frac{1}{v \cdot 2}\right) \leq -3.999999911278523 \cdot 10^{+22}:\\
\;\;\;\;t\_0\\
\mathbf{else}:\\
\;\;\;\;\frac{cosTheta\_i \cdot \left(cosTheta\_i \cdot \left(0.5 \cdot \left(cosTheta\_O \cdot cosTheta\_O\right)\right)\right)}{v \cdot v}\\
\end{array}
\end{array}
if (+.f32 (+.f32 (-.f32 (-.f32 (/.f32 (*.f32 cosTheta_i cosTheta_O) v) (/.f32 (*.f32 sinTheta_i sinTheta_O) v)) (/.f32 #s(literal 1 binary32) v)) #s(literal 6931/10000 binary32)) (log.f32 (/.f32 #s(literal 1 binary32) (*.f32 #s(literal 2 binary32) v)))) < -3.99999991e22Initial program 100.0%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3220.0
Applied rewrites20.0%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f3211.5
Applied rewrites11.5%
Taylor expanded in cosTheta_O around inf
lower-/.f32N/A
lower-*.f3235.2
Applied rewrites35.2%
if -3.99999991e22 < (+.f32 (+.f32 (-.f32 (-.f32 (/.f32 (*.f32 cosTheta_i cosTheta_O) v) (/.f32 (*.f32 sinTheta_i sinTheta_O) v)) (/.f32 #s(literal 1 binary32) v)) #s(literal 6931/10000 binary32)) (log.f32 (/.f32 #s(literal 1 binary32) (*.f32 #s(literal 2 binary32) v)))) Initial program 99.3%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f328.9
Applied rewrites8.9%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f327.2
Applied rewrites7.2%
Taylor expanded in cosTheta_O around inf
associate-*r/N/A
lower-/.f32N/A
associate-*r*N/A
unpow2N/A
associate-*r*N/A
associate-*r*N/A
lower-*.f32N/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f3280.0
Applied rewrites80.0%
Final simplification62.4%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (exp (+ 0.6931 (/ -1.0 v))) (/ 0.5 v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((0.6931f + (-1.0f / v))) * (0.5f / v);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp((0.6931e0 + ((-1.0e0) / v))) * (0.5e0 / v)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(exp(Float32(Float32(0.6931) + Float32(Float32(-1.0) / v))) * Float32(Float32(0.5) / v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(0.6931) + (single(-1.0) / v))) * (single(0.5) / v); end
\begin{array}{l}
\\
e^{0.6931 + \frac{-1}{v}} \cdot \frac{0.5}{v}
\end{array}
Initial program 99.6%
Applied rewrites99.2%
Taylor expanded in cosTheta_i around 0
mul-1-negN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f3299.6
Applied rewrites99.6%
lift-neg.f32N/A
lift-*.f32N/A
+-commutativeN/A
lift-*.f32N/A
lift-neg.f32N/A
distribute-rgt-neg-outN/A
unsub-negN/A
lower--.f32N/A
lower-*.f3299.6
Applied rewrites99.6%
Taylor expanded in sinTheta_O around 0
*-commutativeN/A
associate-*l/N/A
associate-/l*N/A
lower-*.f32N/A
lower-exp.f32N/A
sub-negN/A
lft-mult-inverseN/A
associate-*l/N/A
associate-/r*N/A
lower-+.f32N/A
associate-/r*N/A
associate-*l/N/A
lft-mult-inverseN/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f32N/A
lower-/.f3299.5
Applied rewrites99.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ -1.0 v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((-1.0f / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((-1.0e0) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(-1.0) / v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(-1.0) / v)); end
\begin{array}{l}
\\
e^{\frac{-1}{v}}
\end{array}
Initial program 99.6%
Taylor expanded in v around 0
lower-/.f32N/A
sub-negN/A
lower-fma.f32N/A
+-commutativeN/A
distribute-neg-inN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
metadata-evalN/A
lower-fma.f32N/A
mul-1-negN/A
lower-neg.f3295.4
Applied rewrites94.6%
Taylor expanded in sinTheta_O around 0
div-subN/A
lower-exp.f32N/A
div-subN/A
lower-/.f32N/A
sub-negN/A
metadata-evalN/A
lower-fma.f3294.3
Applied rewrites94.3%
Taylor expanded in cosTheta_O around 0
metadata-evalN/A
distribute-neg-fracN/A
lower-exp.f32N/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f3296.9
Applied rewrites96.9%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(if (<= cosTheta_i -9.999999682655225e-22)
(*
(* cosTheta_O cosTheta_O)
(fma
0.5
(/ (* cosTheta_i cosTheta_i) (* v v))
(/ (+ (/ cosTheta_i v) (/ 1.0 cosTheta_O)) cosTheta_O)))
(*
(* cosTheta_i cosTheta_i)
(fma
0.5
(/ (* cosTheta_O cosTheta_O) (* v v))
(/ cosTheta_O (* v cosTheta_i))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if (cosTheta_i <= -9.999999682655225e-22f) {
tmp = (cosTheta_O * cosTheta_O) * fmaf(0.5f, ((cosTheta_i * cosTheta_i) / (v * v)), (((cosTheta_i / v) + (1.0f / cosTheta_O)) / cosTheta_O));
} else {
tmp = (cosTheta_i * cosTheta_i) * fmaf(0.5f, ((cosTheta_O * cosTheta_O) / (v * v)), (cosTheta_O / (v * cosTheta_i)));
}
return tmp;
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = Float32(0.0) if (cosTheta_i <= Float32(-9.999999682655225e-22)) tmp = Float32(Float32(cosTheta_O * cosTheta_O) * fma(Float32(0.5), Float32(Float32(cosTheta_i * cosTheta_i) / Float32(v * v)), Float32(Float32(Float32(cosTheta_i / v) + Float32(Float32(1.0) / cosTheta_O)) / cosTheta_O))); else tmp = Float32(Float32(cosTheta_i * cosTheta_i) * fma(Float32(0.5), Float32(Float32(cosTheta_O * cosTheta_O) / Float32(v * v)), Float32(cosTheta_O / Float32(v * cosTheta_i)))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;cosTheta\_i \leq -9.999999682655225 \cdot 10^{-22}:\\
\;\;\;\;\left(cosTheta\_O \cdot cosTheta\_O\right) \cdot \mathsf{fma}\left(0.5, \frac{cosTheta\_i \cdot cosTheta\_i}{v \cdot v}, \frac{\frac{cosTheta\_i}{v} + \frac{1}{cosTheta\_O}}{cosTheta\_O}\right)\\
\mathbf{else}:\\
\;\;\;\;\left(cosTheta\_i \cdot cosTheta\_i\right) \cdot \mathsf{fma}\left(0.5, \frac{cosTheta\_O \cdot cosTheta\_O}{v \cdot v}, \frac{cosTheta\_O}{v \cdot cosTheta\_i}\right)\\
\end{array}
\end{array}
if cosTheta_i < -9.9999997e-22Initial program 99.9%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3215.5
Applied rewrites15.5%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f328.0
Applied rewrites8.0%
Taylor expanded in cosTheta_O around -inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
lower-/.f32N/A
Applied rewrites5.1%
if -9.9999997e-22 < cosTheta_i Initial program 99.5%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3212.6
Applied rewrites12.6%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f327.0
Applied rewrites7.0%
Taylor expanded in cosTheta_i around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-/.f32N/A
*-commutativeN/A
lower-*.f3266.6
Applied rewrites25.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(if (<= cosTheta_i -9.999999682655225e-22)
(*
(* cosTheta_O cosTheta_O)
(fma
0.5
(/ (* cosTheta_i cosTheta_i) (* v v))
(/ cosTheta_i (* v cosTheta_O))))
(*
(* cosTheta_i cosTheta_i)
(fma
0.5
(/ (* cosTheta_O cosTheta_O) (* v v))
(/ cosTheta_O (* v cosTheta_i))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if (cosTheta_i <= -9.999999682655225e-22f) {
tmp = (cosTheta_O * cosTheta_O) * fmaf(0.5f, ((cosTheta_i * cosTheta_i) / (v * v)), (cosTheta_i / (v * cosTheta_O)));
} else {
tmp = (cosTheta_i * cosTheta_i) * fmaf(0.5f, ((cosTheta_O * cosTheta_O) / (v * v)), (cosTheta_O / (v * cosTheta_i)));
}
return tmp;
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = Float32(0.0) if (cosTheta_i <= Float32(-9.999999682655225e-22)) tmp = Float32(Float32(cosTheta_O * cosTheta_O) * fma(Float32(0.5), Float32(Float32(cosTheta_i * cosTheta_i) / Float32(v * v)), Float32(cosTheta_i / Float32(v * cosTheta_O)))); else tmp = Float32(Float32(cosTheta_i * cosTheta_i) * fma(Float32(0.5), Float32(Float32(cosTheta_O * cosTheta_O) / Float32(v * v)), Float32(cosTheta_O / Float32(v * cosTheta_i)))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;cosTheta\_i \leq -9.999999682655225 \cdot 10^{-22}:\\
\;\;\;\;\left(cosTheta\_O \cdot cosTheta\_O\right) \cdot \mathsf{fma}\left(0.5, \frac{cosTheta\_i \cdot cosTheta\_i}{v \cdot v}, \frac{cosTheta\_i}{v \cdot cosTheta\_O}\right)\\
\mathbf{else}:\\
\;\;\;\;\left(cosTheta\_i \cdot cosTheta\_i\right) \cdot \mathsf{fma}\left(0.5, \frac{cosTheta\_O \cdot cosTheta\_O}{v \cdot v}, \frac{cosTheta\_O}{v \cdot cosTheta\_i}\right)\\
\end{array}
\end{array}
if cosTheta_i < -9.9999997e-22Initial program 99.9%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3215.5
Applied rewrites15.5%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f328.0
Applied rewrites8.0%
Taylor expanded in cosTheta_O around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-/.f32N/A
*-commutativeN/A
lower-*.f3252.7
Applied rewrites18.0%
if -9.9999997e-22 < cosTheta_i Initial program 99.5%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3212.6
Applied rewrites12.6%
Taylor expanded in v around inf
+-commutativeN/A
associate-+l+N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f327.0
Applied rewrites7.0%
Taylor expanded in cosTheta_i around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-/.f32N/A
*-commutativeN/A
lower-*.f3266.6
Applied rewrites25.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* cosTheta_i cosTheta_O) v))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (cosTheta_i * cosTheta_O) / v;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (costheta_i * costheta_o) / v
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(cosTheta_i * cosTheta_O) / v) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (cosTheta_i * cosTheta_O) / v; end
\begin{array}{l}
\\
\frac{cosTheta\_i \cdot cosTheta\_O}{v}
\end{array}
Initial program 99.6%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3213.3
Applied rewrites13.3%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate-/l*N/A
lower-fma.f32N/A
lower-/.f3211.1
Applied rewrites11.1%
Taylor expanded in cosTheta_O around inf
lower-/.f32N/A
lower-*.f3237.4
Applied rewrites37.4%
Final simplification37.4%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 1.0)
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 1.0f;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = 1.0e0
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(1.0) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(1.0); end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.6%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3213.3
Applied rewrites13.3%
Taylor expanded in cosTheta_i around 0
Applied rewrites6.5%
herbie shell --seed 2024216
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))