
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Herbie found 14 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (/ (- r) 3.0) s))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf(((-r / 3.0f) / s))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(Float32(-r) / Float32(3.0)) / s))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp(((-r / single(3.0)) / s))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{\frac{-r}{3}}{s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
lift-*.f32N/A
lift-/.f32N/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f3299.6
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (+ (* (/ (exp (/ (- r) s)) (* (* PI s) r)) 0.125) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((expf((-r / s)) / ((((float) M_PI) * s) * r)) * 0.125f) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(Float32(pi) * s) * r)) * Float32(0.125)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((exp((-r / s)) / ((single(pi) * s) * r)) * single(0.125)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{e^{\frac{-r}{s}}}{\left(\pi \cdot s\right) \cdot r} \cdot 0.125 + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
*-commutativeN/A
lower-*.f32N/A
mul-1-negN/A
distribute-frac-negN/A
lower-/.f32N/A
lift-neg.f32N/A
lift-/.f32N/A
lift-exp.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3299.6
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (fma (/ 0.125 (* PI s)) (/ (exp (/ (- r) (* 3.0 s))) r) (* (/ (exp (/ (- r) s)) (* (* PI s) r)) 0.125)))
float code(float s, float r) {
return fmaf((0.125f / (((float) M_PI) * s)), (expf((-r / (3.0f * s))) / r), ((expf((-r / s)) / ((((float) M_PI) * s) * r)) * 0.125f));
}
function code(s, r) return fma(Float32(Float32(0.125) / Float32(Float32(pi) * s)), Float32(exp(Float32(Float32(-r) / Float32(Float32(3.0) * s))) / r), Float32(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(Float32(pi) * s) * r)) * Float32(0.125))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{0.125}{\pi \cdot s}, \frac{e^{\frac{-r}{3 \cdot s}}}{r}, \frac{e^{\frac{-r}{s}}}{\left(\pi \cdot s\right) \cdot r} \cdot 0.125\right)
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
*-commutativeN/A
lower-*.f32N/A
mul-1-negN/A
distribute-frac-negN/A
lower-/.f32N/A
lift-neg.f32N/A
lift-/.f32N/A
lift-exp.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3299.6
Applied rewrites99.6%
lift-+.f32N/A
lift-/.f32N/A
lift-*.f32N/A
lift-exp.f32N/A
lift-*.f32N/A
lift-/.f32N/A
lift-neg.f32N/A
lift-*.f32N/A
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
Applied rewrites99.6%
Taylor expanded in s around 0
lower-/.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f3299.6
Applied rewrites99.6%
(FPCore (s r)
:precision binary32
(/
(/
(-
(* 0.125 (exp (/ (- r) s)))
(* -0.125 (exp (/ (* -0.3333333333333333 r) s))))
(* PI s))
r))
float code(float s, float r) {
return (((0.125f * expf((-r / s))) - (-0.125f * expf(((-0.3333333333333333f * r) / s)))) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(Float32(Float32(0.125) * exp(Float32(Float32(-r) / s))) - Float32(Float32(-0.125) * exp(Float32(Float32(Float32(-0.3333333333333333) * r) / s)))) / Float32(Float32(pi) * s)) / r) end
function tmp = code(s, r) tmp = (((single(0.125) * exp((-r / s))) - (single(-0.125) * exp(((single(-0.3333333333333333) * r) / s)))) / (single(pi) * s)) / r; end
\begin{array}{l}
\\
\frac{\frac{0.125 \cdot e^{\frac{-r}{s}} - -0.125 \cdot e^{\frac{-0.3333333333333333 \cdot r}{s}}}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
lift-*.f32N/A
lift-/.f32N/A
associate-*r/N/A
lower-/.f32N/A
lower-*.f3299.6
Applied rewrites99.6%
(FPCore (s r)
:precision binary32
(/
(/
(-
(* 0.125 (exp (/ (- r) s)))
(* -0.125 (exp (* -0.3333333333333333 (/ r s)))))
(* PI s))
r))
float code(float s, float r) {
return (((0.125f * expf((-r / s))) - (-0.125f * expf((-0.3333333333333333f * (r / s))))) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(Float32(Float32(0.125) * exp(Float32(Float32(-r) / s))) - Float32(Float32(-0.125) * exp(Float32(Float32(-0.3333333333333333) * Float32(r / s))))) / Float32(Float32(pi) * s)) / r) end
function tmp = code(s, r) tmp = (((single(0.125) * exp((-r / s))) - (single(-0.125) * exp((single(-0.3333333333333333) * (r / s))))) / (single(pi) * s)) / r; end
\begin{array}{l}
\\
\frac{\frac{0.125 \cdot e^{\frac{-r}{s}} - -0.125 \cdot e^{-0.3333333333333333 \cdot \frac{r}{s}}}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (/ (fma 0.125 (exp (/ (- r) s)) (* (exp (* (/ r s) -0.3333333333333333)) 0.125)) (* (* PI s) r)))
float code(float s, float r) {
return fmaf(0.125f, expf((-r / s)), (expf(((r / s) * -0.3333333333333333f)) * 0.125f)) / ((((float) M_PI) * s) * r);
}
function code(s, r) return Float32(fma(Float32(0.125), exp(Float32(Float32(-r) / s)), Float32(exp(Float32(Float32(r / s) * Float32(-0.3333333333333333))) * Float32(0.125))) / Float32(Float32(Float32(pi) * s) * r)) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(0.125, e^{\frac{-r}{s}}, e^{\frac{r}{s} \cdot -0.3333333333333333} \cdot 0.125\right)}{\left(\pi \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
Applied rewrites99.6%
(FPCore (s r)
:precision binary32
(/
(/
(-
(* 0.125 (exp (/ (- r) s)))
(-
(* (/ (fma -0.006944444444444444 (/ r s) 0.041666666666666664) s) r)
0.125))
(* PI s))
r))
float code(float s, float r) {
return (((0.125f * expf((-r / s))) - (((fmaf(-0.006944444444444444f, (r / s), 0.041666666666666664f) / s) * r) - 0.125f)) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(Float32(Float32(0.125) * exp(Float32(Float32(-r) / s))) - Float32(Float32(Float32(fma(Float32(-0.006944444444444444), Float32(r / s), Float32(0.041666666666666664)) / s) * r) - Float32(0.125))) / Float32(Float32(pi) * s)) / r) end
\begin{array}{l}
\\
\frac{\frac{0.125 \cdot e^{\frac{-r}{s}} - \left(\frac{\mathsf{fma}\left(-0.006944444444444444, \frac{r}{s}, 0.041666666666666664\right)}{s} \cdot r - 0.125\right)}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
Taylor expanded in r around 0
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-fma.f32N/A
pow2N/A
lower-/.f32N/A
lift-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f3210.3
Applied rewrites10.3%
Taylor expanded in s around inf
lower-/.f32N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f3210.3
Applied rewrites10.3%
(FPCore (s r)
:precision binary32
(/
(/
(fma
(-
(* (/ r (* (* s s) PI)) 0.06944444444444445)
(/ 0.16666666666666666 (* PI s)))
r
(/ 0.25 PI))
s)
r))
float code(float s, float r) {
return (fmaf((((r / ((s * s) * ((float) M_PI))) * 0.06944444444444445f) - (0.16666666666666666f / (((float) M_PI) * s))), r, (0.25f / ((float) M_PI))) / s) / r;
}
function code(s, r) return Float32(Float32(fma(Float32(Float32(Float32(r / Float32(Float32(s * s) * Float32(pi))) * Float32(0.06944444444444445)) - Float32(Float32(0.16666666666666666) / Float32(Float32(pi) * s))), r, Float32(Float32(0.25) / Float32(pi))) / s) / r) end
\begin{array}{l}
\\
\frac{\frac{\mathsf{fma}\left(\frac{r}{\left(s \cdot s\right) \cdot \pi} \cdot 0.06944444444444445 - \frac{0.16666666666666666}{\pi \cdot s}, r, \frac{0.25}{\pi}\right)}{s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
lower-/.f32N/A
Applied rewrites8.3%
Taylor expanded in s around inf
lower-/.f32N/A
Applied rewrites9.6%
Taylor expanded in r around 0
*-commutativeN/A
lower-fma.f32N/A
Applied rewrites9.7%
(FPCore (s r)
:precision binary32
(/
(/
(fma
(- (* (/ r (* s s)) 0.06944444444444445) (/ 0.16666666666666666 s))
r
0.25)
(* PI s))
r))
float code(float s, float r) {
return (fmaf((((r / (s * s)) * 0.06944444444444445f) - (0.16666666666666666f / s)), r, 0.25f) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(fma(Float32(Float32(Float32(r / Float32(s * s)) * Float32(0.06944444444444445)) - Float32(Float32(0.16666666666666666) / s)), r, Float32(0.25)) / Float32(Float32(pi) * s)) / r) end
\begin{array}{l}
\\
\frac{\frac{\mathsf{fma}\left(\frac{r}{s \cdot s} \cdot 0.06944444444444445 - \frac{0.16666666666666666}{s}, r, 0.25\right)}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
Taylor expanded in r around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
pow2N/A
lower-/.f32N/A
lift-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f329.7
Applied rewrites9.7%
(FPCore (s r) :precision binary32 (/ (/ (- (* 0.125 (exp (/ (- r) s))) -0.125) (* PI s)) r))
float code(float s, float r) {
return (((0.125f * expf((-r / s))) - -0.125f) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(Float32(Float32(0.125) * exp(Float32(Float32(-r) / s))) - Float32(-0.125)) / Float32(Float32(pi) * s)) / r) end
function tmp = code(s, r) tmp = (((single(0.125) * exp((-r / s))) - single(-0.125)) / (single(pi) * s)) / r; end
\begin{array}{l}
\\
\frac{\frac{0.125 \cdot e^{\frac{-r}{s}} - -0.125}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
Taylor expanded in s around inf
Applied rewrites9.2%
(FPCore (s r) :precision binary32 (/ (/ (fma (/ r (* PI s)) -0.16666666666666666 (/ 0.25 PI)) s) r))
float code(float s, float r) {
return (fmaf((r / (((float) M_PI) * s)), -0.16666666666666666f, (0.25f / ((float) M_PI))) / s) / r;
}
function code(s, r) return Float32(Float32(fma(Float32(r / Float32(Float32(pi) * s)), Float32(-0.16666666666666666), Float32(Float32(0.25) / Float32(pi))) / s) / r) end
\begin{array}{l}
\\
\frac{\frac{\mathsf{fma}\left(\frac{r}{\pi \cdot s}, -0.16666666666666666, \frac{0.25}{\pi}\right)}{s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
lower-/.f32N/A
Applied rewrites8.3%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f32N/A
lift-PI.f328.8
Applied rewrites8.8%
(FPCore (s r) :precision binary32 (/ (/ (fma -0.16666666666666666 (/ r s) 0.25) (* PI s)) r))
float code(float s, float r) {
return (fmaf(-0.16666666666666666f, (r / s), 0.25f) / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(fma(Float32(-0.16666666666666666), Float32(r / s), Float32(0.25)) / Float32(Float32(pi) * s)) / r) end
\begin{array}{l}
\\
\frac{\frac{\mathsf{fma}\left(-0.16666666666666666, \frac{r}{s}, 0.25\right)}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around inf
lower-/.f32N/A
Applied rewrites99.6%
Taylor expanded in r around 0
+-commutativeN/A
lower-fma.f32N/A
lift-/.f328.8
Applied rewrites8.8%
(FPCore (s r) :precision binary32 (/ (/ (/ 0.25 PI) s) r))
float code(float s, float r) {
return ((0.25f / ((float) M_PI)) / s) / r;
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) / Float32(pi)) / s) / r) end
function tmp = code(s, r) tmp = ((single(0.25) / single(pi)) / s) / r; end
\begin{array}{l}
\\
\frac{\frac{\frac{0.25}{\pi}}{s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
lower-/.f32N/A
Applied rewrites8.3%
Taylor expanded in s around inf
lower-/.f32N/A
Applied rewrites9.6%
Taylor expanded in s around inf
lift-/.f32N/A
lift-PI.f328.8
Applied rewrites8.8%
(FPCore (s r) :precision binary32 (/ 0.25 (* (* s r) PI)))
float code(float s, float r) {
return 0.25f / ((s * r) * ((float) M_PI));
}
function code(s, r) return Float32(Float32(0.25) / Float32(Float32(s * r) * Float32(pi))) end
function tmp = code(s, r) tmp = single(0.25) / ((s * r) * single(pi)); end
\begin{array}{l}
\\
\frac{0.25}{\left(s \cdot r\right) \cdot \pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f328.8
Applied rewrites8.8%
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f328.8
Applied rewrites8.8%
herbie shell --seed 2025101
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))