
; Computes exp(((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v - 1/v)
;              + 0.6931 + log(1/(2*v))) with every operation in binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Single-precision evaluation of
!> exp(((ci*co)/v - (si*so)/v - 1/v) + 0.6931 + log(1/(2*v))).
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: cos_term, sin_term, log_term, arg

    cos_term = (costheta_i * costheta_o) / v
    sin_term = (sintheta_i * sintheta_o) / v
    log_term = log(1.0e0 / (2.0e0 * v))
    ! Same left-to-right association as the one-line form.
    arg = (((cos_term - sin_term) - (1.0e0 / v)) + 0.6931e0) + log_term
    res = exp(arg)
end function code
# exp(((ci*cO)/v - (si*sO)/v - 1/v) + 0.6931 + log(1/(2*v))), rounding every
# intermediate result to Float32 exactly as the one-line form does.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cos_term = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_term = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    inv_v = Float32(Float32(1.0) / v)
    log_term = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    diff = Float32(cos_term - sin_term)
    shifted = Float32(Float32(diff - inv_v) + Float32(0.6931))
    return exp(Float32(shifted + log_term))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % exp(((ci*cO)/v - (si*sO)/v - 1/v) + 0.6931 + log(1/(2*v))) with
    % single-precision constants, built from named partial terms.
    cos_term = (cosTheta_i * cosTheta_O) / v;
    sin_term = (sinTheta_i * sinTheta_O) / v;
    inv_v = single(1.0) / v;
    log_term = log(single(1.0) / (single(2.0) * v));
    tmp = exp((((cos_term - sin_term) - inv_v) + single(0.6931)) + log_term);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Computes exp(((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v - 1/v)
;              + 0.6931 + log(1/(2*v))) with every operation in binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Single-precision evaluation of
!> exp(((ci*co)/v - (si*so)/v - 1/v) + 0.6931 + log(1/(2*v))).
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: arg

    ! Accumulate the exponent in the same order as the one-line form.
    arg = (costheta_i * costheta_o) / v
    arg = arg - ((sintheta_i * sintheta_o) / v)
    arg = arg - (1.0e0 / v)
    arg = arg + 0.6931e0
    arg = arg + log(1.0e0 / (2.0e0 * v))
    res = exp(arg)
end function code
# exp(((ci*cO)/v - (si*sO)/v - 1/v) + 0.6931 + log(1/(2*v))); the exponent is
# accumulated step by step with a Float32 rounding after every operation.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    arg = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    arg = Float32(arg - Float32(Float32(sinTheta_i * sinTheta_O) / v))
    arg = Float32(arg - Float32(Float32(1.0) / v))
    arg = Float32(arg + Float32(0.6931))
    arg = Float32(arg + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))
    return exp(arg)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % exp(((ci*cO)/v - (si*sO)/v - 1/v) + 0.6931 + log(1/(2*v))) with
    % single-precision constants; the exponent is accumulated step by step.
    arg = (cosTheta_i * cosTheta_O) / v;
    arg = arg - ((sinTheta_i * sinTheta_O) / v);
    arg = arg - (single(1.0) / v);
    arg = arg + single(0.6931);
    arg = arg + log(single(1.0) / (single(2.0) * v));
    tmp = exp(arg);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
; Computes (exp(0.6931) * (0.5 / v)) * (1 / exp((-1 - sinTheta_i*sinTheta_O) / (-v))) in binary32.
; cosTheta_i and cosTheta_O are declared but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (* (exp 0.6931) (/ 0.5 v)) (/ 1.0 (exp (/ (- -1.0 (* sinTheta_i sinTheta_O)) (- v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(0.6931f) * (0.5f / v)) * (1.0f / expf(((-1.0f - (sinTheta_i * sinTheta_O)) / -v)));
}
!> Evaluate (exp(0.6931) * (0.5 / v)) * (1 / exp((-1 - sintheta_i*sintheta_o) / (-v)))
!> in single precision. costheta_i and costheta_o are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i
    real(4), intent (in) :: costheta_o
    real(4), intent (in) :: sintheta_i
    real(4), intent (in) :: sintheta_o
    real(4), intent (in) :: v
    ! The negated divisor is parenthesised: standard Fortran does not permit a
    ! unary minus directly after another arithmetic operator (as in "/ -v").
    code = (exp(0.6931e0) * (0.5e0 / v)) * (1.0e0 / exp((((-1.0e0) - (sintheta_i * sintheta_o)) / (-v))))
end function code
# (exp(0.6931) * (0.5 / v)) * (1 / exp((-1 - si*sO) / (-v))) with Float32 rounding
# after every operation. cosTheta_i and cosTheta_O are not read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    scale = Float32(exp(Float32(0.6931)) * Float32(Float32(0.5) / v))
    arg = Float32(Float32(Float32(-1.0) - Float32(sinTheta_i * sinTheta_O)) / Float32(-v))
    decay = Float32(Float32(1.0) / exp(arg))
    return Float32(scale * decay)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % (exp(0.6931) * (0.5 / v)) * (1 / exp((-1 - si*sO) / (-v))) with
    % single-precision constants. cosTheta_i and cosTheta_O are not read.
    scale = exp(single(0.6931)) * (single(0.5) / v);
    arg = (single(-1.0) - (sinTheta_i * sinTheta_O)) / -v;
    tmp = scale * (single(1.0) / exp(arg));
end
\begin{array}{l}
\\
\left(e^{0.6931} \cdot \frac{0.5}{v}\right) \cdot \frac{1}{e^{\frac{-1 - sinTheta\_i \cdot sinTheta\_O}{-v}}}
\end{array}
Initial program 99.6%
lift-exp.f32N/A
lift-+.f32N/A
lift-+.f32N/A
associate-+l+N/A
+-commutativeN/A
exp-sumN/A
lower-*.f32N/A
Applied rewrites99.7%
Taylor expanded in cosTheta_i around 0
distribute-lft-inN/A
metadata-evalN/A
mul-1-negN/A
unsub-negN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32 99.7
Applied rewrites99.7%
lift-exp.f32N/A
lift-/.f32N/A
frac-2negN/A
distribute-frac-neg2N/A
exp-negN/A
lower-/.f32N/A
lower-exp.f32N/A
lower-/.f32N/A
lower-neg.f32 99.7
Applied rewrites99.7%
Final simplification99.7%
; Computes (exp(0.6931) * (0.5 / v)) * exp((-1 - sinTheta_i*sinTheta_O) / v) in binary32.
; cosTheta_i and cosTheta_O are declared but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (* (exp 0.6931) (/ 0.5 v)) (exp (/ (- -1.0 (* sinTheta_i sinTheta_O)) v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(0.6931f) * (0.5f / v)) * expf(((-1.0f - (sinTheta_i * sinTheta_O)) / v));
}
!> (exp(0.6931) * (0.5 / v)) * exp((-1 - sintheta_i*sintheta_o) / v) in single
!> precision. costheta_i and costheta_o are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: scale_factor, arg

    scale_factor = exp(0.6931e0) * (0.5e0 / v)
    arg = ((-1.0e0) - (sintheta_i * sintheta_o)) / v
    res = scale_factor * exp(arg)
end function code
# (exp(0.6931) * (0.5 / v)) * exp((-1 - si*sO) / v) with Float32 rounding after
# every operation. cosTheta_i and cosTheta_O are not read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    scale = Float32(exp(Float32(0.6931)) * Float32(Float32(0.5) / v))
    arg = Float32(Float32(Float32(-1.0) - Float32(sinTheta_i * sinTheta_O)) / v)
    return Float32(scale * exp(arg))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % (exp(0.6931) * (0.5 / v)) * exp((-1 - si*sO) / v) with single-precision
    % constants. cosTheta_i and cosTheta_O are not read.
    scale = exp(single(0.6931)) * (single(0.5) / v);
    arg = (single(-1.0) - (sinTheta_i * sinTheta_O)) / v;
    tmp = scale * exp(arg);
end
\begin{array}{l}
\\
\left(e^{0.6931} \cdot \frac{0.5}{v}\right) \cdot e^{\frac{-1 - sinTheta\_i \cdot sinTheta\_O}{v}}
\end{array}
Initial program 99.6%
lift-exp.f32N/A
lift-+.f32N/A
lift-+.f32N/A
associate-+l+N/A
+-commutativeN/A
exp-sumN/A
lower-*.f32N/A
Applied rewrites99.7%
Taylor expanded in cosTheta_i around 0
distribute-lft-inN/A
metadata-evalN/A
mul-1-negN/A
unsub-negN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32 99.7
Applied rewrites99.7%
; Computes (0.5 / v) * exp(0.6931 - 1/v) in binary32.
; Only v appears in the body; the four angle arguments are declared but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (- 0.6931 (/ 1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f - (1.0f / v)));
}
!> (0.5 / v) * exp(0.6931 - 1/v) in single precision.
!> Only v is read; the four angle arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: half_over_v, arg

    half_over_v = 0.5e0 / v
    arg = 0.6931e0 - (1.0e0 / v)
    res = half_over_v * exp(arg)
end function code
# (0.5 / v) * exp(0.6931 - 1/v) with Float32 rounding after every operation.
# Only v is read; the four angle arguments are unused.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    half_over_v = Float32(Float32(0.5) / v)
    arg = Float32(Float32(0.6931) - Float32(Float32(1.0) / v))
    return Float32(half_over_v * exp(arg))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % (0.5 / v) * exp(0.6931 - 1/v) with single-precision constants.
    % Only v is read; the four angle arguments are unused.
    half_over_v = single(0.5) / v;
    arg = single(0.6931) - (single(1.0) / v);
    tmp = half_over_v * exp(arg);
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 - \frac{1}{v}}
\end{array}
Initial program 99.6%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
lower-*.f32N/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
sub-negN/A
+-commutativeN/A
Applied rewrites13.8%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.6%
; Two-regime form in binary32, selected on the product sinTheta_i*sinTheta_O:
;   product <= 4.999999898305949e-32 -> exp(cosTheta_O * (cosTheta_i / v))
;   otherwise                        -> exp((-sinTheta_O) * (sinTheta_i / v))
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (if (<= (* sinTheta_i sinTheta_O) 4.999999898305949e-32) (exp (* cosTheta_O (/ cosTheta_i v))) (exp (* (- sinTheta_O) (/ sinTheta_i v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float tmp;
if ((sinTheta_i * sinTheta_O) <= 4.999999898305949e-32f) {
tmp = expf((cosTheta_O * (cosTheta_i / v)));
} else {
tmp = expf((-sinTheta_O * (sinTheta_i / v)));
}
return tmp;
}
!> Two-regime form selected on sintheta_i * sintheta_o:
!>   product <= 4.999999898305949e-32 -> exp(costheta_o * (costheta_i / v))
!>   otherwise                        -> exp(-sintheta_o * (sintheta_i / v))
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4), parameter :: sin_threshold = 4.999999898305949e-32

    if ((sintheta_i * sintheta_o) <= sin_threshold) then
        res = exp(costheta_o * (costheta_i / v))
    else
        res = exp(-sintheta_o * (sintheta_i / v))
    end if
end function code
# Two-regime form selected on Float32(sinTheta_i * sinTheta_O):
#   product <= 4.999999898305949e-32 -> exp(cosTheta_O * (cosTheta_i / v))
#   otherwise                        -> exp((-sinTheta_O) * (sinTheta_i / v))
# Every intermediate is rounded to Float32. The statements are laid out one per
# line; collapsed onto a single line they have no separators between them.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    tmp = Float32(0.0)
    if (Float32(sinTheta_i * sinTheta_O) <= Float32(4.999999898305949e-32))
        tmp = exp(Float32(cosTheta_O * Float32(cosTheta_i / v)))
    else
        tmp = exp(Float32(Float32(-sinTheta_O) * Float32(sinTheta_i / v)))
    end
    return tmp
end
function tmp_2 = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Two-regime form selected on sinTheta_i * sinTheta_O:
    %   product <= 4.999999898305949e-32 -> exp(cosTheta_O * (cosTheta_i / v))
    %   otherwise                        -> exp(-sinTheta_O * (sinTheta_i / v))
    if ((sinTheta_i * sinTheta_O) <= single(4.999999898305949e-32))
        tmp_2 = exp((cosTheta_O * (cosTheta_i / v)));
    else
        tmp_2 = exp((-sinTheta_O * (sinTheta_i / v)));
    end
end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;sinTheta\_i \cdot sinTheta\_O \leq 4.999999898305949 \cdot 10^{-32}:\\
\;\;\;\;e^{cosTheta\_O \cdot \frac{cosTheta\_i}{v}}\\
\mathbf{else}:\\
\;\;\;\;e^{\left(-sinTheta\_O\right) \cdot \frac{sinTheta\_i}{v}}\\
\end{array}
\end{array}
if (*.f32 sinTheta_i sinTheta_O) < 4.9999999e-32
Initial program 99.5%
lift-+.f32N/A
lift-log.f32N/A
lift-/.f32N/A
log-recN/A
unsub-negN/A
lower--.f32N/A
Applied rewrites99.5%
Taylor expanded in cosTheta_i around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32 12.2
Applied rewrites12.2%
Applied rewrites12.2%
if 4.9999999e-32 < (*.f32 sinTheta_i sinTheta_O)
Initial program 100.0%
lift-+.f32N/A
lift-log.f32N/A
lift-/.f32N/A
log-recN/A
unsub-negN/A
lower--.f32N/A
Applied rewrites100.0%
Taylor expanded in cosTheta_i around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32 8.4
Applied rewrites8.4%
Taylor expanded in sinTheta_i around inf
mul-1-negN/A
associate-/l*N/A
distribute-lft-neg-inN/A
mul-1-negN/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f32N/A
lower-/.f32 48.7
Applied rewrites48.7%
; Computes (0.5 / v) * exp(-1 / v) in binary32.
; Only v appears in the body; the four angle arguments are declared but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (/ -1.0 v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((-1.0f / v));
}
!> (0.5 / v) * exp(-1 / v) in single precision.
!> Only v is read; the four angle arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: half_over_v, decay

    half_over_v = 0.5e0 / v
    decay = exp((-1.0e0) / v)
    res = half_over_v * decay
end function code
# (0.5 / v) * exp(-1 / v) with Float32 rounding after every operation.
# Only v is read; the four angle arguments are unused.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    half_over_v = Float32(Float32(0.5) / v)
    decay = exp(Float32(Float32(-1.0) / v))
    return Float32(half_over_v * decay)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % (0.5 / v) * exp(-1 / v) with single-precision constants.
    % Only v is read; the four angle arguments are unused.
    half_over_v = single(0.5) / v;
    decay = exp(single(-1.0) / v);
    tmp = half_over_v * decay;
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{\frac{-1}{v}}
\end{array}
Initial program 99.6%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
lower-*.f32N/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
sub-negN/A
+-commutativeN/A
Applied rewrites15.7%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.6%
Taylor expanded in v around 0
Applied rewrites96.6%
; Computes exp((fma(cosTheta_i, cosTheta_O, -1) - sinTheta_i*sinTheta_O) / v) in binary32.
; All five arguments appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ (- (fma cosTheta_i cosTheta_O -1.0) (* sinTheta_i sinTheta_O)) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((fmaf(cosTheta_i, cosTheta_O, -1.0f) - (sinTheta_i * sinTheta_O)) / v));
}
# exp((fma(ci, cO, -1) - si*sO) / v) with Float32 rounding after the subtraction
# and the division; the cosine product and -1 offset use a fused multiply-add.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cos_minus_one = fma(cosTheta_i, cosTheta_O, Float32(-1.0))
    numerator = Float32(cos_minus_one - Float32(sinTheta_i * sinTheta_O))
    return exp(Float32(numerator / v))
end
\begin{array}{l}
\\
e^{\frac{\mathsf{fma}\left(cosTheta\_i, cosTheta\_O, -1\right) - sinTheta\_i \cdot sinTheta\_O}{v}}
\end{array}
Initial program 99.6%
lift-+.f32N/A
lift-log.f32N/A
lift-/.f32N/A
log-recN/A
unsub-negN/A
lower--.f32N/A
Applied rewrites99.6%
Taylor expanded in cosTheta_i around 0
distribute-lft-inN/A
metadata-evalN/A
mul-1-negN/A
unsub-negN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32 99.6
Applied rewrites99.6%
Taylor expanded in v around 0
lower-/.f32N/A
associate--r+N/A
lower--.f32N/A
sub-negN/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f32N/A
*-commutativeN/A
lower-*.f32 94.8
Applied rewrites94.8%
; Computes exp(cosTheta_O * (cosTheta_i / v)) in binary32.
; sinTheta_i and sinTheta_O are declared but do not appear in the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (* cosTheta_O (/ cosTheta_i v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((cosTheta_O * (cosTheta_i / v)));
}
!> exp(costheta_o * (costheta_i / v)) in single precision.
!> sintheta_i and sintheta_o are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: scaled_cos_i

    scaled_cos_i = costheta_i / v
    res = exp(costheta_o * scaled_cos_i)
end function code
# exp(cosTheta_O * (cosTheta_i / v)) with Float32 rounding after the division and
# the product. sinTheta_i and sinTheta_O are not read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    scaled_cos_i = Float32(cosTheta_i / v)
    arg = Float32(cosTheta_O * scaled_cos_i)
    return exp(arg)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % exp(cosTheta_O * (cosTheta_i / v)).
    % sinTheta_i and sinTheta_O are not read.
    scaled_cos_i = cosTheta_i / v;
    tmp = exp(cosTheta_O * scaled_cos_i);
end
\begin{array}{l}
\\
e^{cosTheta\_O \cdot \frac{cosTheta\_i}{v}}
\end{array}
Initial program 99.6%
lift-+.f32N/A
lift-log.f32N/A
lift-/.f32N/A
log-recN/A
unsub-negN/A
lower--.f32N/A
Applied rewrites99.6%
Taylor expanded in cosTheta_i around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32 11.6
Applied rewrites11.6%
Applied rewrites11.6%
; Computes (exp(0.6931) / v) * 0.5 in binary32.
; Only v appears in the body; the four angle arguments are declared but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ (exp 0.6931) v) 0.5))
/* (exp(0.6931) / v) * 0.5 in single precision.
 * Only v is read; the four angle parameters are unused. */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
	const float exp_over_v = expf(0.6931f) / v;
	return exp_over_v * 0.5f;
}
!> (exp(0.6931) / v) * 0.5 in single precision.
!> Only v is read; the four angle arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: exp_over_v

    exp_over_v = exp(0.6931e0) / v
    res = exp_over_v * 0.5e0
end function code
# (exp(0.6931) / v) * 0.5 with Float32 rounding after every operation.
# Only v is read; the four angle arguments are unused.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    exp_over_v = Float32(exp(Float32(0.6931)) / v)
    return Float32(exp_over_v * Float32(0.5))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % (exp(0.6931) / v) * 0.5 with single-precision constants.
    % Only v is read; the four angle arguments are unused.
    exp_over_v = exp(single(0.6931)) / v;
    tmp = exp_over_v * single(0.5);
end
\begin{array}{l}
\\
\frac{e^{0.6931}}{v} \cdot 0.5
\end{array}
Initial program 99.6%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
exp-sumN/A
lift-log.f32N/A
rem-exp-logN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
metadata-evalN/A
lower-exp.f32 99.6
lift-+.f32N/A
Applied rewrites99.6%
lift-/.f32N/A
metadata-evalN/A
associate-/r*N/A
lift-*.f32N/A
clear-numN/A
inv-powN/A
sqr-powN/A
pow2N/A
lower-pow.f32N/A
metadata-evalN/A
lower-pow.f32N/A
lift-*.f32N/A
associate-/l*N/A
/-rgt-identityN/A
lift-*.f32 99.6
Applied rewrites99.6%
Taylor expanded in v around inf
*-commutativeN/A
unpow2N/A
rem-square-sqrtN/A
associate-*r/N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower-exp.f32 4.7
Applied rewrites4.7%
herbie shell --seed 2024299
; Benchmark "HairBSDF, Mp, lower", evaluated in binary32.
; :pre restricts cosTheta_i, cosTheta_O, sinTheta_i and sinTheta_O to [-1, 1]
; and v to [-1.5707964, 0.1].
; NOTE(review): the body takes log(1/(2*v)), whose argument is negative for
; v < 0, yet :pre admits negative v — confirm the intended lower bound on v.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))