
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 22 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (* (/ 0.125 r) (fma (pow E (/ (* -0.16666666666666666 r) s)) (/ (pow E (* (/ r s) -0.16666666666666666)) (* PI s)) (/ (exp (/ (- r) s)) (* PI s)))))
float code(float s, float r) {
return (0.125f / r) * fmaf(powf(((float) M_E), ((-0.16666666666666666f * r) / s)), (powf(((float) M_E), ((r / s) * -0.16666666666666666f)) / (((float) M_PI) * s)), (expf((-r / s)) / (((float) M_PI) * s)));
}
function code(s, r) return Float32(Float32(Float32(0.125) / r) * fma((Float32(exp(1)) ^ Float32(Float32(Float32(-0.16666666666666666) * r) / s)), Float32((Float32(exp(1)) ^ Float32(Float32(r / s) * Float32(-0.16666666666666666))) / Float32(Float32(pi) * s)), Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(pi) * s)))) end
\begin{array}{l}
\\
\frac{0.125}{r} \cdot \mathsf{fma}\left({e}^{\left(\frac{-0.16666666666666666 \cdot r}{s}\right)}, \frac{{e}^{\left(\frac{r}{s} \cdot -0.16666666666666666\right)}}{\pi \cdot s}, \frac{e^{\frac{-r}{s}}}{\pi \cdot s}\right)
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
distribute-lft-outN/A
*-commutativeN/A
associate-/l*N/A
lower-*.f32N/A
Applied rewrites99.7%
Applied rewrites99.7%
Applied rewrites99.7%
Applied rewrites99.8%
Final simplification99.8%
(FPCore (s r) :precision binary32 (let* ((t_0 (pow E (* (/ r s) -0.16666666666666666)))) (* (fma t_0 (/ t_0 (* PI s)) (/ (exp (/ (- r) s)) (* PI s))) (/ 0.125 r))))
float code(float s, float r) {
float t_0 = powf(((float) M_E), ((r / s) * -0.16666666666666666f));
return fmaf(t_0, (t_0 / (((float) M_PI) * s)), (expf((-r / s)) / (((float) M_PI) * s))) * (0.125f / r);
}
function code(s, r) t_0 = Float32(exp(1)) ^ Float32(Float32(r / s) * Float32(-0.16666666666666666)) return Float32(fma(t_0, Float32(t_0 / Float32(Float32(pi) * s)), Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(pi) * s))) * Float32(Float32(0.125) / r)) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := {e}^{\left(\frac{r}{s} \cdot -0.16666666666666666\right)}\\
\mathsf{fma}\left(t\_0, \frac{t\_0}{\pi \cdot s}, \frac{e^{\frac{-r}{s}}}{\pi \cdot s}\right) \cdot \frac{0.125}{r}
\end{array}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
distribute-lft-outN/A
*-commutativeN/A
associate-/l*N/A
lower-*.f32N/A
Applied rewrites99.5%
Applied rewrites99.5%
Applied rewrites99.6%
herbie shell --seed 2024230
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))