
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (fma 0.75 (/ (exp (/ (* -0.3333333333333333 r) s)) (* (* (* PI 6.0) s) r)) (* (/ (exp (/ (- r) s)) (* (* PI s) r)) 0.125)))
float code(float s, float r) {
return fmaf(0.75f, (expf(((-0.3333333333333333f * r) / s)) / (((((float) M_PI) * 6.0f) * s) * r)), ((expf((-r / s)) / ((((float) M_PI) * s) * r)) * 0.125f));
}
function code(s, r) return fma(Float32(0.75), Float32(exp(Float32(Float32(Float32(-0.3333333333333333) * r) / s)) / Float32(Float32(Float32(Float32(pi) * Float32(6.0)) * s) * r)), Float32(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(Float32(pi) * s) * r)) * Float32(0.125))) end
\begin{array}{l}
\\
\mathsf{fma}\left(0.75, \frac{e^{\frac{-0.3333333333333333 \cdot r}{s}}}{\left(\left(\pi \cdot 6\right) \cdot s\right) \cdot r}, \frac{e^{\frac{-r}{s}}}{\left(\pi \cdot s\right) \cdot r} \cdot 0.125\right)
\end{array}
Initial program 99.6%
Applied rewrites99.6%
Taylor expanded in r around 0
lower-*.f3299.6
Applied rewrites99.6%
Taylor expanded in s around 0
*-commutativeN/A
lower-*.f32N/A
mul-1-negN/A
distribute-frac-negN/A
lower-/.f32N/A
lift-/.f32N/A
lift-neg.f32N/A
lift-exp.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f3299.6
Applied rewrites99.6%
(FPCore (s r)
:precision binary32
(+
(/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r))
(/
(/
(fma (fma -0.25 r (* s 0.75)) s (* (* r r) 0.041666666666666664))
(* s s))
(* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((fmaf(fmaf(-0.25f, r, (s * 0.75f)), s, ((r * r) * 0.041666666666666664f)) / (s * s)) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(fma(fma(Float32(-0.25), r, Float32(s * Float32(0.75))), s, Float32(Float32(r * r) * Float32(0.041666666666666664))) / Float32(s * s)) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{\frac{\mathsf{fma}\left(\mathsf{fma}\left(-0.25, r, s \cdot 0.75\right), s, \left(r \cdot r\right) \cdot 0.041666666666666664\right)}{s \cdot s}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f3210.7
Applied rewrites10.7%
Taylor expanded in s around 0
lower-/.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower-fma.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
pow2N/A
lift-*.f3210.7
Applied rewrites10.7%
(FPCore (s r) :precision binary32 (fma (/ (exp (/ (- r) s)) (* (* (* 2.0 PI) s) r)) 0.25 (/ (fma (/ (fma (/ r s) -0.041666666666666664 0.25) (- s)) r 0.75) (* (* (* PI 6.0) s) r))))
float code(float s, float r) {
return fmaf((expf((-r / s)) / (((2.0f * ((float) M_PI)) * s) * r)), 0.25f, (fmaf((fmaf((r / s), -0.041666666666666664f, 0.25f) / -s), r, 0.75f) / (((((float) M_PI) * 6.0f) * s) * r)));
}
function code(s, r) return fma(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)), Float32(0.25), Float32(fma(Float32(fma(Float32(r / s), Float32(-0.041666666666666664), Float32(0.25)) / Float32(-s)), r, Float32(0.75)) / Float32(Float32(Float32(Float32(pi) * Float32(6.0)) * s) * r))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r}, 0.25, \frac{\mathsf{fma}\left(\frac{\mathsf{fma}\left(\frac{r}{s}, -0.041666666666666664, 0.25\right)}{-s}, r, 0.75\right)}{\left(\left(\pi \cdot 6\right) \cdot s\right) \cdot r}\right)
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f3210.7
Applied rewrites10.7%
Taylor expanded in s around -inf
mul-1-negN/A
lower-neg.f32N/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f3210.7
Applied rewrites10.7%
Applied rewrites10.7%
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (fma (/ (fma -0.25 s (* 0.041666666666666664 r)) (* s s)) r 0.75) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + (fmaf((fmaf(-0.25f, s, (0.041666666666666664f * r)) / (s * s)), r, 0.75f) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(fma(Float32(fma(Float32(-0.25), s, Float32(Float32(0.041666666666666664) * r)) / Float32(s * s)), r, Float32(0.75)) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{\mathsf{fma}\left(\frac{\mathsf{fma}\left(-0.25, s, 0.041666666666666664 \cdot r\right)}{s \cdot s}, r, 0.75\right)}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f3210.7
Applied rewrites10.7%
Taylor expanded in s around 0
lower-/.f32N/A
lower-fma.f32N/A
lower-*.f32N/A
pow2N/A
lift-*.f3210.7
Applied rewrites10.7%
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (fma (/ (fma -0.5 (/ (* r r) s) r) s) -1.0 1.0)) (* (* (* 2.0 PI) s) r)) (/ (fma (- (* (/ r (* s s)) 0.041666666666666664) (/ 0.25 s)) r 0.75) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * fmaf((fmaf(-0.5f, ((r * r) / s), r) / s), -1.0f, 1.0f)) / (((2.0f * ((float) M_PI)) * s) * r)) + (fmaf((((r / (s * s)) * 0.041666666666666664f) - (0.25f / s)), r, 0.75f) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * fma(Float32(fma(Float32(-0.5), Float32(Float32(r * r) / s), r) / s), Float32(-1.0), Float32(1.0))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(fma(Float32(Float32(Float32(r / Float32(s * s)) * Float32(0.041666666666666664)) - Float32(Float32(0.25) / s)), r, Float32(0.75)) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
\begin{array}{l}
\\
\frac{0.25 \cdot \mathsf{fma}\left(\frac{\mathsf{fma}\left(-0.5, \frac{r \cdot r}{s}, r\right)}{s}, -1, 1\right)}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{\mathsf{fma}\left(\frac{r}{s \cdot s} \cdot 0.041666666666666664 - \frac{0.25}{s}, r, 0.75\right)}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Initial program 99.6%
Taylor expanded in r around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f3210.7
Applied rewrites10.7%
Taylor expanded in s around -inf
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f3210.1
Applied rewrites10.1%
(FPCore (s r)
:precision binary32
(-
(/
(-
(-
(/
(-
(- (/ (* (/ r PI) -0.06944444444444445) s))
(/ 0.16666666666666666 PI))
s))
(/ 0.25 (* PI r)))
s)))
float code(float s, float r) {
return -((-((-(((r / ((float) M_PI)) * -0.06944444444444445f) / s) - (0.16666666666666666f / ((float) M_PI))) / s) - (0.25f / (((float) M_PI) * r))) / s);
}
function code(s, r) return Float32(-Float32(Float32(Float32(-Float32(Float32(Float32(-Float32(Float32(Float32(r / Float32(pi)) * Float32(-0.06944444444444445)) / s)) - Float32(Float32(0.16666666666666666) / Float32(pi))) / s)) - Float32(Float32(0.25) / Float32(Float32(pi) * r))) / s)) end
function tmp = code(s, r) tmp = -((-((-(((r / single(pi)) * single(-0.06944444444444445)) / s) - (single(0.16666666666666666) / single(pi))) / s) - (single(0.25) / (single(pi) * r))) / s); end
\begin{array}{l}
\\
-\frac{\left(-\frac{\left(-\frac{\frac{r}{\pi} \cdot -0.06944444444444445}{s}\right) - \frac{0.16666666666666666}{\pi}}{s}\right) - \frac{0.25}{\pi \cdot r}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
mul-1-negN/A
lower-neg.f32N/A
lower-/.f32N/A
Applied rewrites10.1%
(FPCore (s r)
:precision binary32
(-
(/
(-
(/ (fma (/ (/ r s) PI) -0.06944444444444445 (/ 0.16666666666666666 PI)) s)
(/ 0.25 (* PI r)))
s)))
float code(float s, float r) {
return -(((fmaf(((r / s) / ((float) M_PI)), -0.06944444444444445f, (0.16666666666666666f / ((float) M_PI))) / s) - (0.25f / (((float) M_PI) * r))) / s);
}
function code(s, r) return Float32(-Float32(Float32(Float32(fma(Float32(Float32(r / s) / Float32(pi)), Float32(-0.06944444444444445), Float32(Float32(0.16666666666666666) / Float32(pi))) / s) - Float32(Float32(0.25) / Float32(Float32(pi) * r))) / s)) end
\begin{array}{l}
\\
-\frac{\frac{\mathsf{fma}\left(\frac{\frac{r}{s}}{\pi}, -0.06944444444444445, \frac{0.16666666666666666}{\pi}\right)}{s} - \frac{0.25}{\pi \cdot r}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around -inf
Applied rewrites9.8%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-fma.f32N/A
associate-/r*N/A
lower-/.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
associate-*r/N/A
metadata-evalN/A
lift-/.f32N/A
lift-PI.f3210.1
Applied rewrites10.1%
(FPCore (s r) :precision binary32 (/ (- (/ 0.25 (* PI r)) (/ 0.16666666666666666 (* PI s))) s))
float code(float s, float r) {
return ((0.25f / (((float) M_PI) * r)) - (0.16666666666666666f / (((float) M_PI) * s))) / s;
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) / Float32(Float32(pi) * r)) - Float32(Float32(0.16666666666666666) / Float32(Float32(pi) * s))) / s) end
function tmp = code(s, r) tmp = ((single(0.25) / (single(pi) * r)) - (single(0.16666666666666666) / (single(pi) * s))) / s; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi \cdot r} - \frac{0.16666666666666666}{\pi \cdot s}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 (* PI s)) r))
float code(float s, float r) {
return (0.25f / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(Float32(pi) * s)) / r) end
function tmp = code(s, r) tmp = (single(0.25) / (single(pi) * s)) / r; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
associate-/r*N/A
metadata-evalN/A
*-commutativeN/A
associate-*r/N/A
lower-/.f32N/A
associate-*r/N/A
metadata-evalN/A
lower-/.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 r) (* PI s)))
float code(float s, float r) {
return (0.25f / r) / (((float) M_PI) * s);
}
function code(s, r) return Float32(Float32(Float32(0.25) / r) / Float32(Float32(pi) * s)) end
function tmp = code(s, r) tmp = (single(0.25) / r) / (single(pi) * s); end
\begin{array}{l}
\\
\frac{\frac{0.25}{r}}{\pi \cdot s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
*-commutativeN/A
*-commutativeN/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ 0.25 (* (* s r) PI)))
float code(float s, float r) {
return 0.25f / ((s * r) * ((float) M_PI));
}
function code(s, r) return Float32(Float32(0.25) / Float32(Float32(s * r) * Float32(pi))) end
function tmp = code(s, r) tmp = single(0.25) / ((s * r) * single(pi)); end
\begin{array}{l}
\\
\frac{0.25}{\left(s \cdot r\right) \cdot \pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ 0.25 (* s (* PI r))))
float code(float s, float r) {
return 0.25f / (s * (((float) M_PI) * r));
}
function code(s, r) return Float32(Float32(0.25) / Float32(s * Float32(Float32(pi) * r))) end
function tmp = code(s, r) tmp = single(0.25) / (s * (single(pi) * r)); end
\begin{array}{l}
\\
\frac{0.25}{s \cdot \left(\pi \cdot r\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
*-commutativeN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lift-PI.f329.0
Applied rewrites9.0%
herbie shell --seed 2025102
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))