
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 11 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (+ (/ (* (exp (/ r (- s))) 0.125) (* s (* r PI))) (/ (* 0.75 (exp (/ r (* s -3.0)))) (* (* r 6.0) (* s PI)))))
float code(float s, float r) {
return ((expf((r / -s)) * 0.125f) / (s * (r * ((float) M_PI)))) + ((0.75f * expf((r / (s * -3.0f)))) / ((r * 6.0f) * (s * ((float) M_PI))));
}
function code(s, r) return Float32(Float32(Float32(exp(Float32(r / Float32(-s))) * Float32(0.125)) / Float32(s * Float32(r * Float32(pi)))) + Float32(Float32(Float32(0.75) * exp(Float32(r / Float32(s * Float32(-3.0))))) / Float32(Float32(r * Float32(6.0)) * Float32(s * Float32(pi))))) end
function tmp = code(s, r) tmp = ((exp((r / -s)) * single(0.125)) / (s * (r * single(pi)))) + ((single(0.75) * exp((r / (s * single(-3.0))))) / ((r * single(6.0)) * (s * single(pi)))); end
\begin{array}{l}
\\
\frac{e^{\frac{r}{-s}} \cdot 0.125}{s \cdot \left(r \cdot \pi\right)} + \frac{0.75 \cdot e^{\frac{r}{s \cdot -3}}}{\left(r \cdot 6\right) \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
lift-PI.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f3299.7
Applied rewrites99.7%
Applied rewrites99.7%
lift-*.f32N/A
distribute-frac-negN/A
distribute-frac-neg2N/A
lower-/.f32N/A
lift-*.f32N/A
*-commutativeN/A
distribute-rgt-neg-inN/A
lower-*.f32N/A
metadata-eval99.7
Applied rewrites99.7%
(FPCore (s r) :precision binary32 (* (/ 0.125 (* s PI)) (+ (/ (exp (/ r (* s -3.0))) r) (/ (exp (/ r (- s))) r))))
float code(float s, float r) {
return (0.125f / (s * ((float) M_PI))) * ((expf((r / (s * -3.0f))) / r) + (expf((r / -s)) / r));
}
function code(s, r) return Float32(Float32(Float32(0.125) / Float32(s * Float32(pi))) * Float32(Float32(exp(Float32(r / Float32(s * Float32(-3.0)))) / r) + Float32(exp(Float32(r / Float32(-s))) / r))) end
function tmp = code(s, r) tmp = (single(0.125) / (s * single(pi))) * ((exp((r / (s * single(-3.0)))) / r) + (exp((r / -s)) / r)); end
\begin{array}{l}
\\
\frac{0.125}{s \cdot \pi} \cdot \left(\frac{e^{\frac{r}{s \cdot -3}}}{r} + \frac{e^{\frac{r}{-s}}}{r}\right)
\end{array}
Initial program 99.6%
Applied rewrites99.6%
(FPCore (s r)
:precision binary32
(+
(/ (* (exp (/ r (- s))) 0.25) (* r (* s (* PI 2.0))))
(/
(+
(/ 0.125 (* r PI))
(fma
r
(/ 0.006944444444444444 (* s (* s PI)))
(/ -0.041666666666666664 (* s PI))))
s)))
float code(float s, float r) {
return ((expf((r / -s)) * 0.25f) / (r * (s * (((float) M_PI) * 2.0f)))) + (((0.125f / (r * ((float) M_PI))) + fmaf(r, (0.006944444444444444f / (s * (s * ((float) M_PI)))), (-0.041666666666666664f / (s * ((float) M_PI))))) / s);
}
function code(s, r) return Float32(Float32(Float32(exp(Float32(r / Float32(-s))) * Float32(0.25)) / Float32(r * Float32(s * Float32(Float32(pi) * Float32(2.0))))) + Float32(Float32(Float32(Float32(0.125) / Float32(r * Float32(pi))) + fma(r, Float32(Float32(0.006944444444444444) / Float32(s * Float32(s * Float32(pi)))), Float32(Float32(-0.041666666666666664) / Float32(s * Float32(pi))))) / s)) end
\begin{array}{l}
\\
\frac{e^{\frac{r}{-s}} \cdot 0.25}{r \cdot \left(s \cdot \left(\pi \cdot 2\right)\right)} + \frac{\frac{0.125}{r \cdot \pi} + \mathsf{fma}\left(r, \frac{0.006944444444444444}{s \cdot \left(s \cdot \pi\right)}, \frac{-0.041666666666666664}{s \cdot \pi}\right)}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
Applied rewrites10.0%
Final simplification10.0%
(FPCore (s r) :precision binary32 (fma (+ (/ 0.75 r) (/ (fma (/ r s) 0.041666666666666664 -0.25) s)) (/ 0.16666666666666666 (* s PI)) (* (exp (/ r (- s))) (/ 0.125 (* PI (* r s))))))
float code(float s, float r) {
return fmaf(((0.75f / r) + (fmaf((r / s), 0.041666666666666664f, -0.25f) / s)), (0.16666666666666666f / (s * ((float) M_PI))), (expf((r / -s)) * (0.125f / (((float) M_PI) * (r * s)))));
}
function code(s, r) return fma(Float32(Float32(Float32(0.75) / r) + Float32(fma(Float32(r / s), Float32(0.041666666666666664), Float32(-0.25)) / s)), Float32(Float32(0.16666666666666666) / Float32(s * Float32(pi))), Float32(exp(Float32(r / Float32(-s))) * Float32(Float32(0.125) / Float32(Float32(pi) * Float32(r * s))))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{0.75}{r} + \frac{\mathsf{fma}\left(\frac{r}{s}, 0.041666666666666664, -0.25\right)}{s}, \frac{0.16666666666666666}{s \cdot \pi}, e^{\frac{r}{-s}} \cdot \frac{0.125}{\pi \cdot \left(r \cdot s\right)}\right)
\end{array}
Initial program 99.6%
Applied rewrites98.1%
Taylor expanded in s around -inf
+-commutativeN/A
lower-+.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f32N/A
associate-*r/N/A
lower-/.f32N/A
+-commutativeN/A
distribute-rgt-inN/A
*-commutativeN/A
associate-*l*N/A
metadata-evalN/A
metadata-evalN/A
lower-fma.f32N/A
lower-/.f329.9
Applied rewrites9.9%
(FPCore (s r)
:precision binary32
(/
(fma
r
(/
(fma 0.06944444444444445 (/ r (* s PI)) (/ -0.16666666666666666 PI))
(* s s))
(/ 0.25 (* s PI)))
r))
float code(float s, float r) {
return fmaf(r, (fmaf(0.06944444444444445f, (r / (s * ((float) M_PI))), (-0.16666666666666666f / ((float) M_PI))) / (s * s)), (0.25f / (s * ((float) M_PI)))) / r;
}
function code(s, r) return Float32(fma(r, Float32(fma(Float32(0.06944444444444445), Float32(r / Float32(s * Float32(pi))), Float32(Float32(-0.16666666666666666) / Float32(pi))) / Float32(s * s)), Float32(Float32(0.25) / Float32(s * Float32(pi)))) / r) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(r, \frac{\mathsf{fma}\left(0.06944444444444445, \frac{r}{s \cdot \pi}, \frac{-0.16666666666666666}{\pi}\right)}{s \cdot s}, \frac{0.25}{s \cdot \pi}\right)}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
Applied rewrites9.5%
(FPCore (s r) :precision binary32 (- (/ (fma (/ r PI) (/ -0.06944444444444445 s) (/ 0.16666666666666666 PI)) (- (* s s))) (/ -0.25 (* s (* r PI)))))
float code(float s, float r) {
return (fmaf((r / ((float) M_PI)), (-0.06944444444444445f / s), (0.16666666666666666f / ((float) M_PI))) / -(s * s)) - (-0.25f / (s * (r * ((float) M_PI))));
}
function code(s, r) return Float32(Float32(fma(Float32(r / Float32(pi)), Float32(Float32(-0.06944444444444445) / s), Float32(Float32(0.16666666666666666) / Float32(pi))) / Float32(-Float32(s * s))) - Float32(Float32(-0.25) / Float32(s * Float32(r * Float32(pi))))) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(\frac{r}{\pi}, \frac{-0.06944444444444445}{s}, \frac{0.16666666666666666}{\pi}\right)}{-s \cdot s} - \frac{-0.25}{s \cdot \left(r \cdot \pi\right)}
\end{array}
Initial program 99.6%
lift-PI.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f3299.7
Applied rewrites99.7%
Applied rewrites99.7%
Taylor expanded in s around -inf
mul-1-negN/A
lower-neg.f32N/A
div-subN/A
sub-negN/A
lower-+.f32N/A
Applied rewrites9.4%
Final simplification9.4%
(FPCore (s r) :precision binary32 (+ (/ (fma 0.06944444444444445 (/ r (* s PI)) (/ -0.16666666666666666 PI)) (* s s)) (/ 0.25 (* r (* s PI)))))
float code(float s, float r) {
return (fmaf(0.06944444444444445f, (r / (s * ((float) M_PI))), (-0.16666666666666666f / ((float) M_PI))) / (s * s)) + (0.25f / (r * (s * ((float) M_PI))));
}
function code(s, r) return Float32(Float32(fma(Float32(0.06944444444444445), Float32(r / Float32(s * Float32(pi))), Float32(Float32(-0.16666666666666666) / Float32(pi))) / Float32(s * s)) + Float32(Float32(0.25) / Float32(r * Float32(s * Float32(pi))))) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(0.06944444444444445, \frac{r}{s \cdot \pi}, \frac{-0.16666666666666666}{\pi}\right)}{s \cdot s} + \frac{0.25}{r \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
Applied rewrites9.4%
(FPCore (s r) :precision binary32 (/ 0.25 (* r (* (sqrt PI) (* s (sqrt PI))))))
float code(float s, float r) {
return 0.25f / (r * (sqrtf(((float) M_PI)) * (s * sqrtf(((float) M_PI)))));
}
function code(s, r) return Float32(Float32(0.25) / Float32(r * Float32(sqrt(Float32(pi)) * Float32(s * sqrt(Float32(pi)))))) end
function tmp = code(s, r) tmp = single(0.25) / (r * (sqrt(single(pi)) * (s * sqrt(single(pi))))); end
\begin{array}{l}
\\
\frac{0.25}{r \cdot \left(\sqrt{\pi} \cdot \left(s \cdot \sqrt{\pi}\right)\right)}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f328.5
Applied rewrites8.5%
add-sqr-sqrtN/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
lift-PI.f32N/A
lower-sqrt.f32N/A
lift-PI.f32N/A
lower-sqrt.f328.5
Applied rewrites8.5%
Final simplification8.5%
(FPCore (s r) :precision binary32 (/ 0.25 (* r (* s PI))))
float code(float s, float r) {
return 0.25f / (r * (s * ((float) M_PI)));
}
function code(s, r) return Float32(Float32(0.25) / Float32(r * Float32(s * Float32(pi)))) end
function tmp = code(s, r) tmp = single(0.25) / (r * (s * single(pi))); end
\begin{array}{l}
\\
\frac{0.25}{r \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f328.5
Applied rewrites8.5%
(FPCore (s r) :precision binary32 (/ 0.125 (* PI (* r s))))
float code(float s, float r) {
return 0.125f / (((float) M_PI) * (r * s));
}
function code(s, r) return Float32(Float32(0.125) / Float32(Float32(pi) * Float32(r * s))) end
function tmp = code(s, r) tmp = single(0.125) / (single(pi) * (r * s)); end
\begin{array}{l}
\\
\frac{0.125}{\pi \cdot \left(r \cdot s\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
Applied rewrites9.8%
Taylor expanded in r around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
sub-negN/A
associate-*r/N/A
metadata-evalN/A
lower-+.f32N/A
lower-/.f32N/A
lower-*.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
Applied rewrites4.2%
Taylor expanded in r around 0
lower-/.f32N/A
*-commutativeN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f326.9
Applied rewrites6.9%
lift-PI.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f326.9
Applied rewrites6.9%
Final simplification6.9%
(FPCore (s r) :precision binary32 (/ 0.125 (* s (* r PI))))
float code(float s, float r) {
return 0.125f / (s * (r * ((float) M_PI)));
}
function code(s, r) return Float32(Float32(0.125) / Float32(s * Float32(r * Float32(pi)))) end
function tmp = code(s, r) tmp = single(0.125) / (s * (r * single(pi))); end
\begin{array}{l}
\\
\frac{0.125}{s \cdot \left(r \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
Applied rewrites9.8%
Taylor expanded in r around inf
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
sub-negN/A
associate-*r/N/A
metadata-evalN/A
lower-+.f32N/A
lower-/.f32N/A
lower-*.f32N/A
unpow2N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
Applied rewrites4.2%
Taylor expanded in r around 0
lower-/.f32N/A
*-commutativeN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f326.9
Applied rewrites6.9%
herbie shell --seed 2024219
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))