
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (fma (/ (exp (/ (* r -0.3333333333333333) s)) (* (* (* 6.0 PI) s) r)) 0.75 (/ 0.125 (* (* PI s) (* (exp (/ r s)) r)))))
float code(float s, float r) {
return fmaf((expf(((r * -0.3333333333333333f) / s)) / (((6.0f * ((float) M_PI)) * s) * r)), 0.75f, (0.125f / ((((float) M_PI) * s) * (expf((r / s)) * r))));
}
function code(s, r) return fma(Float32(exp(Float32(Float32(r * Float32(-0.3333333333333333)) / s)) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r)), Float32(0.75), Float32(Float32(0.125) / Float32(Float32(Float32(pi) * s) * Float32(exp(Float32(r / s)) * r)))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{e^{\frac{r \cdot -0.3333333333333333}{s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}, 0.75, \frac{0.125}{\left(\pi \cdot s\right) \cdot \left(e^{\frac{r}{s}} \cdot r\right)}\right)
\end{array}
Initial program 99.6%
Applied rewrites99.6%
lift-/.f32N/A
lift-/.f32N/A
associate-/l/N/A
lower-/.f32N/A
lift-*.f32N/A
associate-*l*N/A
lower-*.f32N/A
lower-*.f3299.6
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (/ (fma (/ (exp (/ (* r -0.3333333333333333) s)) (* PI s)) 0.125 (/ 0.125 (* (* PI s) (exp (/ r s))))) r))
float code(float s, float r) {
return fmaf((expf(((r * -0.3333333333333333f) / s)) / (((float) M_PI) * s)), 0.125f, (0.125f / ((((float) M_PI) * s) * expf((r / s))))) / r;
}
function code(s, r) return Float32(fma(Float32(exp(Float32(Float32(r * Float32(-0.3333333333333333)) / s)) / Float32(Float32(pi) * s)), Float32(0.125), Float32(Float32(0.125) / Float32(Float32(Float32(pi) * s) * exp(Float32(r / s))))) / r) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(\frac{e^{\frac{r \cdot -0.3333333333333333}{s}}}{\pi \cdot s}, 0.125, \frac{0.125}{\left(\pi \cdot s\right) \cdot e^{\frac{r}{s}}}\right)}{r}
\end{array}
Initial program 99.6%
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (/ (* 0.125 (/ (+ (exp (/ (* -0.3333333333333333 r) s)) (exp (/ (- r) s))) (* PI s))) r))
float code(float s, float r) {
return (0.125f * ((expf(((-0.3333333333333333f * r) / s)) + expf((-r / s))) / (((float) M_PI) * s))) / r;
}
function code(s, r) return Float32(Float32(Float32(0.125) * Float32(Float32(exp(Float32(Float32(Float32(-0.3333333333333333) * r) / s)) + exp(Float32(Float32(-r) / s))) / Float32(Float32(pi) * s))) / r) end
function tmp = code(s, r) tmp = (single(0.125) * ((exp(((single(-0.3333333333333333) * r) / s)) + exp((-r / s))) / (single(pi) * s))) / r; end
\begin{array}{l}
\\
\frac{0.125 \cdot \frac{e^{\frac{-0.3333333333333333 \cdot r}{s}} + e^{\frac{-r}{s}}}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Applied rewrites99.6%
lift-fma.f32N/A
*-commutativeN/A
lift-/.f32N/A
mult-flipN/A
distribute-lft-outN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
*-commutativeN/A
associate-/r*N/A
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (/ 0.25 (* (log (exp (* PI r))) s)))
float code(float s, float r) {
return 0.25f / (logf(expf((((float) M_PI) * r))) * s);
}
function code(s, r) return Float32(Float32(0.25) / Float32(log(exp(Float32(Float32(pi) * r))) * s)) end
function tmp = code(s, r) tmp = single(0.25) / (log(exp((single(pi) * r))) * s); end
\begin{array}{l}
\\
\frac{0.25}{\log \left(e^{\pi \cdot r}\right) \cdot s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-PI.f32N/A
add-log-expN/A
log-pow-revN/A
lower-log.f32N/A
lift-PI.f32N/A
pow-expN/A
*-commutativeN/A
lift-*.f32N/A
lower-exp.f3243.0
lift-*.f32N/A
*-commutativeN/A
lower-*.f3243.0
Applied rewrites43.0%
(FPCore (s r) :precision binary32 (/ 0.25 (log (exp (* (* PI s) r)))))
float code(float s, float r) {
return 0.25f / logf(expf(((((float) M_PI) * s) * r)));
}
function code(s, r) return Float32(Float32(0.25) / log(exp(Float32(Float32(Float32(pi) * s) * r)))) end
function tmp = code(s, r) tmp = single(0.25) / log(exp(((single(pi) * s) * r))); end
\begin{array}{l}
\\
\frac{0.25}{\log \left(e^{\left(\pi \cdot s\right) \cdot r}\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f32N/A
add-log-expN/A
log-pow-revN/A
lower-log.f32N/A
lift-PI.f32N/A
pow-expN/A
lift-*.f32N/A
associate-*l*N/A
*-commutativeN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lower-exp.f3210.4
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f3210.4
Applied rewrites10.4%
(FPCore (s r) :precision binary32 (/ (fma (/ 1.0 PI) (/ 0.125 s) (/ 0.125 (* (+ s r) PI))) r))
float code(float s, float r) {
return fmaf((1.0f / ((float) M_PI)), (0.125f / s), (0.125f / ((s + r) * ((float) M_PI)))) / r;
}
function code(s, r) return Float32(fma(Float32(Float32(1.0) / Float32(pi)), Float32(Float32(0.125) / s), Float32(Float32(0.125) / Float32(Float32(s + r) * Float32(pi)))) / r) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(\frac{1}{\pi}, \frac{0.125}{s}, \frac{0.125}{\left(s + r\right) \cdot \pi}\right)}{r}
\end{array}
Initial program 99.6%
Applied rewrites99.6%
Taylor expanded in r around 0
lower-fma.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-PI.f3212.3
Applied rewrites12.3%
lift-fma.f32N/A
lift-/.f32N/A
associate-*l/N/A
lift-*.f32N/A
times-fracN/A
lift-exp.f32N/A
lift-/.f32N/A
lift-*.f32N/A
lift-PI.f32N/A
lower-fma.f32N/A
Applied rewrites12.3%
Taylor expanded in s around inf
lower-/.f32N/A
lower-PI.f329.4
Applied rewrites9.4%
(FPCore (s r) :precision binary32 (* (/ 0.25 (* s r)) (/ 1.0 PI)))
float code(float s, float r) {
return (0.25f / (s * r)) * (1.0f / ((float) M_PI));
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(s * r)) * Float32(Float32(1.0) / Float32(pi))) end
function tmp = code(s, r) tmp = (single(0.25) / (s * r)) * (single(1.0) / single(pi)); end
\begin{array}{l}
\\
\frac{0.25}{s \cdot r} \cdot \frac{1}{\pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
mult-flipN/A
lower-*.f32N/A
lower-/.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ (/ 0.25 r) PI) s))
float code(float s, float r) {
return ((0.25f / r) / ((float) M_PI)) / s;
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) / r) / Float32(pi)) / s) end
function tmp = code(s, r) tmp = ((single(0.25) / r) / single(pi)) / s; end
\begin{array}{l}
\\
\frac{\frac{\frac{0.25}{r}}{\pi}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lift-*.f32N/A
*-commutativeN/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 PI) (* s r)))
float code(float s, float r) {
return (0.25f / ((float) M_PI)) / (s * r);
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(pi)) / Float32(s * r)) end
function tmp = code(s, r) tmp = (single(0.25) / single(pi)) / (s * r); end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi}}{s \cdot r}
\end{array}
Initial program 99.6%
Applied rewrites99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 (* s r)) PI))
float code(float s, float r) {
return (0.25f / (s * r)) / ((float) M_PI);
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(s * r)) / Float32(pi)) end
function tmp = code(s, r) tmp = (single(0.25) / (s * r)) / single(pi); end
\begin{array}{l}
\\
\frac{\frac{0.25}{s \cdot r}}{\pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ 0.25 (* (* s r) PI)))
float code(float s, float r) {
return 0.25f / ((s * r) * ((float) M_PI));
}
function code(s, r) return Float32(Float32(0.25) / Float32(Float32(s * r) * Float32(pi))) end
function tmp = code(s, r) tmp = single(0.25) / ((s * r) * single(pi)); end
\begin{array}{l}
\\
\frac{0.25}{\left(s \cdot r\right) \cdot \pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ 0.25 (* r (* s PI))))
float code(float s, float r) {
return 0.25f / (r * (s * ((float) M_PI)));
}
function code(s, r) return Float32(Float32(0.25) / Float32(r * Float32(s * Float32(pi)))) end
function tmp = code(s, r) tmp = single(0.25) / (r * (s * single(pi))); end
\begin{array}{l}
\\
\frac{0.25}{r \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
herbie shell --seed 2025154
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))