
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 20 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (fma (/ 0.16666666666666666 (* r PI)) (* (exp (* -0.3333333333333333 (/ r s))) (/ 0.75 s)) (* 0.125 (/ (exp (/ (- r) s)) (* (* s PI) r)))))
float code(float s, float r) {
return fmaf((0.16666666666666666f / (r * ((float) M_PI))), (expf((-0.3333333333333333f * (r / s))) * (0.75f / s)), (0.125f * (expf((-r / s)) / ((s * ((float) M_PI)) * r))));
}
function code(s, r) return fma(Float32(Float32(0.16666666666666666) / Float32(r * Float32(pi))), Float32(exp(Float32(Float32(-0.3333333333333333) * Float32(r / s))) * Float32(Float32(0.75) / s)), Float32(Float32(0.125) * Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(s * Float32(pi)) * r)))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{0.16666666666666666}{r \cdot \pi}, e^{-0.3333333333333333 \cdot \frac{r}{s}} \cdot \frac{0.75}{s}, 0.125 \cdot \frac{e^{\frac{-r}{s}}}{\left(s \cdot \pi\right) \cdot r}\right)
\end{array}
Initial program 99.8%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
associate-*l*N/A
associate-/r*N/A
lower-/.f32N/A
Applied rewrites99.8%
Taylor expanded in r around inf
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower-exp.f32N/A
associate-*r/N/A
lower-/.f32N/A
mul-1-negN/A
lower-neg.f32N/A
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-PI.f3299.8
Applied rewrites99.8%
Applied rewrites99.8%
lift-fma.f32N/A
*-commutativeN/A
lower-fma.f3299.8
Applied rewrites99.8%
Final simplification99.8%
(FPCore (s r) :precision binary32 (+ (/ (* (* (exp (/ r (* -3.0 s))) 0.75) 0.16666666666666666) (* (* s PI) r)) (* (/ (exp (/ (- r) s)) (* (* s r) PI)) 0.125)))
float code(float s, float r) {
return (((expf((r / (-3.0f * s))) * 0.75f) * 0.16666666666666666f) / ((s * ((float) M_PI)) * r)) + ((expf((-r / s)) / ((s * r) * ((float) M_PI))) * 0.125f);
}
function code(s, r) return Float32(Float32(Float32(Float32(exp(Float32(r / Float32(Float32(-3.0) * s))) * Float32(0.75)) * Float32(0.16666666666666666)) / Float32(Float32(s * Float32(pi)) * r)) + Float32(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(s * r) * Float32(pi))) * Float32(0.125))) end
function tmp = code(s, r) tmp = (((exp((r / (single(-3.0) * s))) * single(0.75)) * single(0.16666666666666666)) / ((s * single(pi)) * r)) + ((exp((-r / s)) / ((s * r) * single(pi))) * single(0.125)); end
\begin{array}{l}
\\
\frac{\left(e^{\frac{r}{-3 \cdot s}} \cdot 0.75\right) \cdot 0.16666666666666666}{\left(s \cdot \pi\right) \cdot r} + \frac{e^{\frac{-r}{s}}}{\left(s \cdot r\right) \cdot \pi} \cdot 0.125
\end{array}
Initial program 99.6%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
associate-*l*N/A
associate-/r*N/A
lower-/.f32N/A
Applied rewrites99.6%
Taylor expanded in r around inf
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower-exp.f32N/A
associate-*r/N/A
lower-/.f32N/A
mul-1-negN/A
lower-neg.f32N/A
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-PI.f3299.6
Applied rewrites99.6%
Final simplification99.6%
herbie shell --seed 2024229
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))