
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (/ (fma (exp (/ (- r) s)) 0.125 (* 0.125 (exp (/ r (* s -3.0))))) (* (* PI r) s)))
float code(float s, float r) {
return fmaf(expf((-r / s)), 0.125f, (0.125f * expf((r / (s * -3.0f))))) / ((((float) M_PI) * r) * s);
}
function code(s, r) return Float32(fma(exp(Float32(Float32(-r) / s)), Float32(0.125), Float32(Float32(0.125) * exp(Float32(r / Float32(s * Float32(-3.0)))))) / Float32(Float32(Float32(pi) * r) * s)) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(e^{\frac{-r}{s}}, 0.125, 0.125 \cdot e^{\frac{r}{s \cdot -3}}\right)}{\left(\pi \cdot r\right) \cdot s}
\end{array}
Initial program 99.6%
lift-+.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
div-add-revN/A
lower-/.f32N/A
Applied rewrites99.5%
Applied rewrites99.6%
lift-fma.f32N/A
lift-/.f32N/A
lift-/.f32N/A
frac-timesN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-/.f32N/A
+-commutativeN/A
lift-*.f32N/A
Applied rewrites99.5%
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
*-commutativeN/A
associate-*l*N/A
lift-*.f32N/A
lift-*.f3299.5
Applied rewrites99.5%
(FPCore (s r) :precision binary32 (/ (* 0.125 (+ (exp (/ (- r) s)) (exp (/ r (* -3.0 s))))) (* (* PI s) r)))
float code(float s, float r) {
return (0.125f * (expf((-r / s)) + expf((r / (-3.0f * s))))) / ((((float) M_PI) * s) * r);
}
function code(s, r) return Float32(Float32(Float32(0.125) * Float32(exp(Float32(Float32(-r) / s)) + exp(Float32(r / Float32(Float32(-3.0) * s))))) / Float32(Float32(Float32(pi) * s) * r)) end
function tmp = code(s, r) tmp = (single(0.125) * (exp((-r / s)) + exp((r / (single(-3.0) * s))))) / ((single(pi) * s) * r); end
\begin{array}{l}
\\
\frac{0.125 \cdot \left(e^{\frac{-r}{s}} + e^{\frac{r}{-3 \cdot s}}\right)}{\left(\pi \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
lift-+.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
div-add-revN/A
lower-/.f32N/A
Applied rewrites99.5%
Applied rewrites99.6%
lift-fma.f32N/A
lift-/.f32N/A
lift-/.f32N/A
frac-timesN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-/.f32N/A
+-commutativeN/A
lift-*.f32N/A
Applied rewrites99.5%
lift-fma.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
distribute-rgt-outN/A
lower-*.f32N/A
lower-+.f3299.5
Applied rewrites99.5%
(FPCore (s r) :precision binary32 (/ 0.25 (* (log (pow (exp PI) r)) s)))
float code(float s, float r) {
return 0.25f / (logf(powf(expf(((float) M_PI)), r)) * s);
}
function code(s, r) return Float32(Float32(0.25) / Float32(log((exp(Float32(pi)) ^ r)) * s)) end
function tmp = code(s, r) tmp = single(0.25) / (log((exp(single(pi)) ^ r)) * s); end
\begin{array}{l}
\\
\frac{0.25}{\log \left({\left(e^{\pi}\right)}^{r}\right) \cdot s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
associate-*r*N/A
lift-*.f32N/A
lower-*.f329.0
lift-*.f32N/A
*-commutativeN/A
lower-*.f329.0
Applied rewrites9.0%
lift-*.f32N/A
*-commutativeN/A
lift-PI.f32N/A
add-log-expN/A
log-pow-revN/A
lower-log.f32N/A
lower-pow.f32N/A
lift-PI.f32N/A
lower-exp.f3243.1
Applied rewrites43.1%
(FPCore (s r) :precision binary32 (- (/ 0.25 (* (* PI s) r)) (/ (- (/ 0.16666666666666666 PI) (/ (* (/ r PI) 0.06944444444444445) s)) (* s s))))
float code(float s, float r) {
return (0.25f / ((((float) M_PI) * s) * r)) - (((0.16666666666666666f / ((float) M_PI)) - (((r / ((float) M_PI)) * 0.06944444444444445f) / s)) / (s * s));
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(Float32(Float32(pi) * s) * r)) - Float32(Float32(Float32(Float32(0.16666666666666666) / Float32(pi)) - Float32(Float32(Float32(r / Float32(pi)) * Float32(0.06944444444444445)) / s)) / Float32(s * s))) end
function tmp = code(s, r) tmp = (single(0.25) / ((single(pi) * s) * r)) - (((single(0.16666666666666666) / single(pi)) - (((r / single(pi)) * single(0.06944444444444445)) / s)) / (s * s)); end
\begin{array}{l}
\\
\frac{0.25}{\left(\pi \cdot s\right) \cdot r} - \frac{\frac{0.16666666666666666}{\pi} - \frac{\frac{r}{\pi} \cdot 0.06944444444444445}{s}}{s \cdot s}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
lower-*.f32N/A
lower-/.f32N/A
Applied rewrites10.2%
Applied rewrites10.2%
(FPCore (s r) :precision binary32 (/ (- (/ 0.25 (* PI r)) (/ (- (/ 0.16666666666666666 PI) (/ (* (/ r PI) 0.06944444444444445) s)) s)) s))
float code(float s, float r) {
return ((0.25f / (((float) M_PI) * r)) - (((0.16666666666666666f / ((float) M_PI)) - (((r / ((float) M_PI)) * 0.06944444444444445f) / s)) / s)) / s;
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) / Float32(Float32(pi) * r)) - Float32(Float32(Float32(Float32(0.16666666666666666) / Float32(pi)) - Float32(Float32(Float32(r / Float32(pi)) * Float32(0.06944444444444445)) / s)) / s)) / s) end
function tmp = code(s, r) tmp = ((single(0.25) / (single(pi) * r)) - (((single(0.16666666666666666) / single(pi)) - (((r / single(pi)) * single(0.06944444444444445)) / s)) / s)) / s; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi \cdot r} - \frac{\frac{0.16666666666666666}{\pi} - \frac{\frac{r}{\pi} \cdot 0.06944444444444445}{s}}{s}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
lower-*.f32N/A
lower-/.f32N/A
Applied rewrites10.2%
lift-*.f32N/A
mul-1-negN/A
lift-/.f32N/A
distribute-neg-fracN/A
lower-/.f32N/A
Applied rewrites10.2%
(FPCore (s r) :precision binary32 (/ (fma (exp (/ (- r) s)) 0.125 0.125) (* (* PI s) r)))
float code(float s, float r) {
return fmaf(expf((-r / s)), 0.125f, 0.125f) / ((((float) M_PI) * s) * r);
}
function code(s, r) return Float32(fma(exp(Float32(Float32(-r) / s)), Float32(0.125), Float32(0.125)) / Float32(Float32(Float32(pi) * s) * r)) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(e^{\frac{-r}{s}}, 0.125, 0.125\right)}{\left(\pi \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
lift-+.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
div-add-revN/A
lower-/.f32N/A
Applied rewrites99.5%
Applied rewrites99.6%
lift-fma.f32N/A
lift-/.f32N/A
lift-/.f32N/A
frac-timesN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-/.f32N/A
+-commutativeN/A
lift-*.f32N/A
Applied rewrites99.5%
Taylor expanded in s around inf
Applied rewrites9.5%
(FPCore (s r) :precision binary32 (* (/ 1.0 (sqrt PI)) (/ 0.25 (* (* s r) (sqrt PI)))))
float code(float s, float r) {
return (1.0f / sqrtf(((float) M_PI))) * (0.25f / ((s * r) * sqrtf(((float) M_PI))));
}
function code(s, r) return Float32(Float32(Float32(1.0) / sqrt(Float32(pi))) * Float32(Float32(0.25) / Float32(Float32(s * r) * sqrt(Float32(pi))))) end
function tmp = code(s, r) tmp = (single(1.0) / sqrt(single(pi))) * (single(0.25) / ((s * r) * sqrt(single(pi)))); end
\begin{array}{l}
\\
\frac{1}{\sqrt{\pi}} \cdot \frac{0.25}{\left(s \cdot r\right) \cdot \sqrt{\pi}}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lower-*.f32N/A
lower-*.f329.0
Applied rewrites9.0%
lift-/.f32N/A
div-flipN/A
inv-powN/A
lift-*.f32N/A
lift-PI.f32N/A
add-sqr-sqrtN/A
lift-PI.f32N/A
lift-sqrt.f32N/A
lift-PI.f32N/A
lift-sqrt.f32N/A
associate-*l*N/A
lift-*.f32N/A
*-commutativeN/A
associate-/l*N/A
unpow-prod-downN/A
inv-powN/A
div-flipN/A
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
lift-*.f32N/A
*-commutativeN/A
lower-*.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (* (/ 1.0 (* PI r)) (/ 0.25 s)))
float code(float s, float r) {
return (1.0f / (((float) M_PI) * r)) * (0.25f / s);
}
function code(s, r) return Float32(Float32(Float32(1.0) / Float32(Float32(pi) * r)) * Float32(Float32(0.25) / s)) end
function tmp = code(s, r) tmp = (single(1.0) / (single(pi) * r)) * (single(0.25) / s); end
\begin{array}{l}
\\
\frac{1}{\pi \cdot r} \cdot \frac{0.25}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
associate-*r*N/A
lift-*.f32N/A
associate-/l/N/A
mult-flip-revN/A
lift-/.f32N/A
*-commutativeN/A
associate-/l*N/A
lower-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 s) (* PI r)))
float code(float s, float r) {
return (0.25f / s) / (((float) M_PI) * r);
}
function code(s, r) return Float32(Float32(Float32(0.25) / s) / Float32(Float32(pi) * r)) end
function tmp = code(s, r) tmp = (single(0.25) / s) / (single(pi) * r); end
\begin{array}{l}
\\
\frac{\frac{0.25}{s}}{\pi \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lower-*.f32N/A
lower-*.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f32N/A
*-commutativeN/A
lower-*.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ 0.25 (* r (* s PI))))
float code(float s, float r) {
return 0.25f / (r * (s * ((float) M_PI)));
}
function code(s, r) return Float32(Float32(0.25) / Float32(r * Float32(s * Float32(pi)))) end
function tmp = code(s, r) tmp = single(0.25) / (r * (s * single(pi))); end
\begin{array}{l}
\\
\frac{0.25}{r \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
herbie shell --seed 2025149
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))