
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 20 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (let* ((t_0 (/ 0.125 (* s PI)))) (* (/ 1.0 r) (fma (exp (/ r (- s))) t_0 (* t_0 (exp (/ r (* s -3.0))))))))
float code(float s, float r) {
float t_0 = 0.125f / (s * ((float) M_PI));
return (1.0f / r) * fmaf(expf((r / -s)), t_0, (t_0 * expf((r / (s * -3.0f)))));
}
function code(s, r) t_0 = Float32(Float32(0.125) / Float32(s * Float32(pi))) return Float32(Float32(Float32(1.0) / r) * fma(exp(Float32(r / Float32(-s))), t_0, Float32(t_0 * exp(Float32(r / Float32(s * Float32(-3.0))))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{0.125}{s \cdot \pi}\\
\frac{1}{r} \cdot \mathsf{fma}\left(e^{\frac{r}{-s}}, t\_0, t\_0 \cdot e^{\frac{r}{s \cdot -3}}\right)
\end{array}
\end{array}
Initial program 99.7%
Applied egg-rr99.8%
Final simplification99.8%
(FPCore (s r)
:precision binary32
(let* ((t_0 (exp (/ r (- s)))) (t_1 (/ 0.125 (* s PI))))
(if (<=
(+
(/ (* t_0 0.25) (* r (* s (* PI 2.0))))
(/ (* 0.75 (exp (/ r (* (- s) 3.0)))) (* r (* s (* PI 6.0)))))
1.999999987845058e-8)
(/ (/ (* 0.125 (exp (* (/ r s) -0.3333333333333333))) (* s PI)) r)
(*
(/ 1.0 r)
(fma
t_0
t_1
(*
t_1
(fma
r
(fma
r
(fma
(/ r (* s (* s s)))
-0.006172839506172839
(/ 0.05555555555555555 (* s s)))
(/ -0.3333333333333333 s))
1.0)))))))
float code(float s, float r) {
float t_0 = expf((r / -s));
float t_1 = 0.125f / (s * ((float) M_PI));
float tmp;
if ((((t_0 * 0.25f) / (r * (s * (((float) M_PI) * 2.0f)))) + ((0.75f * expf((r / (-s * 3.0f)))) / (r * (s * (((float) M_PI) * 6.0f))))) <= 1.999999987845058e-8f) {
tmp = ((0.125f * expf(((r / s) * -0.3333333333333333f))) / (s * ((float) M_PI))) / r;
} else {
tmp = (1.0f / r) * fmaf(t_0, t_1, (t_1 * fmaf(r, fmaf(r, fmaf((r / (s * (s * s))), -0.006172839506172839f, (0.05555555555555555f / (s * s))), (-0.3333333333333333f / s)), 1.0f)));
}
return tmp;
}
function code(s, r) t_0 = exp(Float32(r / Float32(-s))) t_1 = Float32(Float32(0.125) / Float32(s * Float32(pi))) tmp = Float32(0.0) if (Float32(Float32(Float32(t_0 * Float32(0.25)) / Float32(r * Float32(s * Float32(Float32(pi) * Float32(2.0))))) + Float32(Float32(Float32(0.75) * exp(Float32(r / Float32(Float32(-s) * Float32(3.0))))) / Float32(r * Float32(s * Float32(Float32(pi) * Float32(6.0)))))) <= Float32(1.999999987845058e-8)) tmp = Float32(Float32(Float32(Float32(0.125) * exp(Float32(Float32(r / s) * Float32(-0.3333333333333333)))) / Float32(s * Float32(pi))) / r); else tmp = Float32(Float32(Float32(1.0) / r) * fma(t_0, t_1, Float32(t_1 * fma(r, fma(r, fma(Float32(r / Float32(s * Float32(s * s))), Float32(-0.006172839506172839), Float32(Float32(0.05555555555555555) / Float32(s * s))), Float32(Float32(-0.3333333333333333) / s)), Float32(1.0))))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{r}{-s}}\\
t_1 := \frac{0.125}{s \cdot \pi}\\
\mathbf{if}\;\frac{t\_0 \cdot 0.25}{r \cdot \left(s \cdot \left(\pi \cdot 2\right)\right)} + \frac{0.75 \cdot e^{\frac{r}{\left(-s\right) \cdot 3}}}{r \cdot \left(s \cdot \left(\pi \cdot 6\right)\right)} \leq 1.999999987845058 \cdot 10^{-8}:\\
\;\;\;\;\frac{\frac{0.125 \cdot e^{\frac{r}{s} \cdot -0.3333333333333333}}{s \cdot \pi}}{r}\\
\mathbf{else}:\\
\;\;\;\;\frac{1}{r} \cdot \mathsf{fma}\left(t\_0, t\_1, t\_1 \cdot \mathsf{fma}\left(r, \mathsf{fma}\left(r, \mathsf{fma}\left(\frac{r}{s \cdot \left(s \cdot s\right)}, -0.006172839506172839, \frac{0.05555555555555555}{s \cdot s}\right), \frac{-0.3333333333333333}{s}\right), 1\right)\right)\\
\end{array}
\end{array}
if (+.f32 (/.f32 (*.f32 #s(literal 1/4 binary32) (exp.f32 (/.f32 (neg.f32 r) s))) (*.f32 (*.f32 (*.f32 #s(literal 2 binary32) (PI.f32)) s) r)) (/.f32 (*.f32 #s(literal 3/4 binary32) (exp.f32 (/.f32 (neg.f32 r) (*.f32 #s(literal 3 binary32) s)))) (*.f32 (*.f32 (*.f32 #s(literal 6 binary32) (PI.f32)) s) r))) < 1.99999999e-8Initial program 99.8%
Taylor expanded in r around inf
distribute-lft-outN/A
metadata-evalN/A
associate-*r*N/A
distribute-lft-outN/A
lower-/.f32N/A
Simplified99.8%
Applied egg-rr99.7%
Taylor expanded in s around -inf
mul-1-negN/A
unsub-negN/A
lower--.f32N/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f3255.7
Simplified55.7%
Taylor expanded in r around inf
associate-*r/N/A
lower-/.f32N/A
lower-*.f32N/A
lower-exp.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f3299.7
Simplified99.7%
if 1.99999999e-8 < (+.f32 (/.f32 (*.f32 #s(literal 1/4 binary32) (exp.f32 (/.f32 (neg.f32 r) s))) (*.f32 (*.f32 (*.f32 #s(literal 2 binary32) (PI.f32)) s) r)) (/.f32 (*.f32 #s(literal 3/4 binary32) (exp.f32 (/.f32 (neg.f32 r) (*.f32 #s(literal 3 binary32) s)))) (*.f32 (*.f32 (*.f32 #s(literal 6 binary32) (PI.f32)) s) r))) Initial program 97.9%
Applied egg-rr97.5%
Taylor expanded in r around 0
+-commutativeN/A
lower-fma.f32N/A
Simplified71.3%
Final simplification96.8%
herbie shell --seed 2024218
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))