
(FPCore (u v) :precision binary32 (+ 1.0 (* v (log (+ u (* (- 1.0 u) (exp (/ -2.0 v))))))))
float code(float u, float v) {
return 1.0f + (v * logf((u + ((1.0f - u) * expf((-2.0f / v))))));
}
real(4) function code(u, v)
real(4), intent (in) :: u
real(4), intent (in) :: v
code = 1.0e0 + (v * log((u + ((1.0e0 - u) * exp(((-2.0e0) / v))))))
end function
function code(u, v) return Float32(Float32(1.0) + Float32(v * log(Float32(u + Float32(Float32(Float32(1.0) - u) * exp(Float32(Float32(-2.0) / v))))))) end
function tmp = code(u, v) tmp = single(1.0) + (v * log((u + ((single(1.0) - u) * exp((single(-2.0) / v)))))); end
\begin{array}{l}
\\
1 + v \cdot \log \left(u + \left(1 - u\right) \cdot e^{\frac{-2}{v}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 23 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u v) :precision binary32 (+ 1.0 (* v (log (+ u (* (- 1.0 u) (exp (/ -2.0 v))))))))
float code(float u, float v) {
return 1.0f + (v * logf((u + ((1.0f - u) * expf((-2.0f / v))))));
}
real(4) function code(u, v)
real(4), intent (in) :: u
real(4), intent (in) :: v
code = 1.0e0 + (v * log((u + ((1.0e0 - u) * exp(((-2.0e0) / v))))))
end function
function code(u, v) return Float32(Float32(1.0) + Float32(v * log(Float32(u + Float32(Float32(Float32(1.0) - u) * exp(Float32(Float32(-2.0) / v))))))) end
function tmp = code(u, v) tmp = single(1.0) + (v * log((u + ((single(1.0) - u) * exp((single(-2.0) / v)))))); end
\begin{array}{l}
\\
1 + v \cdot \log \left(u + \left(1 - u\right) \cdot e^{\frac{-2}{v}}\right)
\end{array}
(FPCore (u v) :precision binary32 (fma v (log (fma (/ 1.0 (exp (/ 2.0 v))) (- 1.0 u) u)) 1.0))
float code(float u, float v) {
return fmaf(v, logf(fmaf((1.0f / expf((2.0f / v))), (1.0f - u), u)), 1.0f);
}
function code(u, v) return fma(v, log(fma(Float32(Float32(1.0) / exp(Float32(Float32(2.0) / v))), Float32(Float32(1.0) - u), u)), Float32(1.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(v, \log \left(\mathsf{fma}\left(\frac{1}{e^{\frac{2}{v}}}, 1 - u, u\right)\right), 1\right)
\end{array}
Initial program 99.5%
Taylor expanded in v around 0
+-commutativeN/A
lower-fma.f32N/A
lower-log.f32N/A
+-commutativeN/A
lower-fma.f32N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
associate-*r/N/A
lower-exp.f32N/A
associate-*r/N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f32N/A
lower--.f3299.5
Simplified99.5%
frac-2negN/A
metadata-evalN/A
distribute-frac-neg2N/A
exp-negN/A
lower-/.f32N/A
lower-exp.f32N/A
lower-/.f3299.5
Applied egg-rr99.5%
(FPCore (u v) :precision binary32 (if (<= (* v (log (+ u (* (- 1.0 u) (exp (/ -2.0 v)))))) -1.0) (+ 1.0 (fma u 2.0 (fma u (/ (fma v 2.0 1.3333333333333333) (* v v)) -2.0))) 1.0))
float code(float u, float v) {
float tmp;
if ((v * logf((u + ((1.0f - u) * expf((-2.0f / v)))))) <= -1.0f) {
tmp = 1.0f + fmaf(u, 2.0f, fmaf(u, (fmaf(v, 2.0f, 1.3333333333333333f) / (v * v)), -2.0f));
} else {
tmp = 1.0f;
}
return tmp;
}
function code(u, v) tmp = Float32(0.0) if (Float32(v * log(Float32(u + Float32(Float32(Float32(1.0) - u) * exp(Float32(Float32(-2.0) / v)))))) <= Float32(-1.0)) tmp = Float32(Float32(1.0) + fma(u, Float32(2.0), fma(u, Float32(fma(v, Float32(2.0), Float32(1.3333333333333333)) / Float32(v * v)), Float32(-2.0)))); else tmp = Float32(1.0); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;v \cdot \log \left(u + \left(1 - u\right) \cdot e^{\frac{-2}{v}}\right) \leq -1:\\
\;\;\;\;1 + \mathsf{fma}\left(u, 2, \mathsf{fma}\left(u, \frac{\mathsf{fma}\left(v, 2, 1.3333333333333333\right)}{v \cdot v}, -2\right)\right)\\
\mathbf{else}:\\
\;\;\;\;1\\
\end{array}
\end{array}
if (*.f32 v (log.f32 (+.f32 u (*.f32 (-.f32 #s(literal 1 binary32) u) (exp.f32 (/.f32 #s(literal -2 binary32) v)))))) < -1Initial program 93.1%
Taylor expanded in v around -inf
Simplified69.9%
Taylor expanded in u around 0
sub-negN/A
mul-1-negN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
metadata-evalN/A
lower-fma.f32N/A
Simplified64.3%
Taylor expanded in v around 0
lower-/.f32N/A
+-commutativeN/A
lower-fma.f32N/A
unpow2N/A
lower-*.f3264.3
Simplified64.3%
lift-fma.f32N/A
lift-*.f32N/A
lift-/.f32N/A
lift-+.f32N/A
lift-+.f32N/A
distribute-rgt-inN/A
*-commutativeN/A
associate-+l+N/A
lower-fma.f32N/A
*-commutativeN/A
lower-fma.f3264.3
lift-fma.f32N/A
*-commutativeN/A
lower-fma.f3264.3
Applied egg-rr64.3%
if -1 < (*.f32 v (log.f32 (+.f32 u (*.f32 (-.f32 #s(literal 1 binary32) u) (exp.f32 (/.f32 #s(literal -2 binary32) v)))))) Initial program 99.9%
Taylor expanded in v around 0
Simplified92.4%
herbie shell --seed 2024218
(FPCore (u v)
:name "HairBSDF, sample_f, cosTheta"
:precision binary32
:pre (and (and (<= 1e-5 u) (<= u 1.0)) (and (<= 0.0 v) (<= v 109.746574)))
(+ 1.0 (* v (log (+ u (* (- 1.0 u) (exp (/ -2.0 v))))))))