
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s r) :precision binary32 (+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))
float code(float s, float r) {
return ((0.25f * expf((-r / s))) / (((2.0f * ((float) M_PI)) * s) * r)) + ((0.75f * expf((-r / (3.0f * s)))) / (((6.0f * ((float) M_PI)) * s) * r));
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) * exp(Float32(Float32(-r) / s))) / Float32(Float32(Float32(Float32(2.0) * Float32(pi)) * s) * r)) + Float32(Float32(Float32(0.75) * exp(Float32(Float32(-r) / Float32(Float32(3.0) * s)))) / Float32(Float32(Float32(Float32(6.0) * Float32(pi)) * s) * r))) end
function tmp = code(s, r) tmp = ((single(0.25) * exp((-r / s))) / (((single(2.0) * single(pi)) * s) * r)) + ((single(0.75) * exp((-r / (single(3.0) * s)))) / (((single(6.0) * single(pi)) * s) * r)); end
\begin{array}{l}
\\
\frac{0.25 \cdot e^{\frac{-r}{s}}}{\left(\left(2 \cdot \pi\right) \cdot s\right) \cdot r} + \frac{0.75 \cdot e^{\frac{-r}{3 \cdot s}}}{\left(\left(6 \cdot \pi\right) \cdot s\right) \cdot r}
\end{array}
(FPCore (s r) :precision binary32 (/ (fma 0.125 (/ (exp (* -1.0 (/ r s))) (* r PI)) (/ (* (/ (exp (/ r (* s -3.0))) r) 0.75) (* PI 6.0))) s))
float code(float s, float r) {
return fmaf(0.125f, (expf((-1.0f * (r / s))) / (r * ((float) M_PI))), (((expf((r / (s * -3.0f))) / r) * 0.75f) / (((float) M_PI) * 6.0f))) / s;
}
function code(s, r) return Float32(fma(Float32(0.125), Float32(exp(Float32(Float32(-1.0) * Float32(r / s))) / Float32(r * Float32(pi))), Float32(Float32(Float32(exp(Float32(r / Float32(s * Float32(-3.0)))) / r) * Float32(0.75)) / Float32(Float32(pi) * Float32(6.0)))) / s) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(0.125, \frac{e^{-1 \cdot \frac{r}{s}}}{r \cdot \pi}, \frac{\frac{e^{\frac{r}{s \cdot -3}}}{r} \cdot 0.75}{\pi \cdot 6}\right)}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
lower-/.f32N/A
Applied rewrites99.5%
Applied rewrites99.5%
(FPCore (s r) :precision binary32 (fma (/ (exp (/ r (* s -3.0))) s) (/ (/ 0.125 r) PI) (* (/ (exp (/ (- r) s)) (* (* PI s) r)) 0.125)))
float code(float s, float r) {
return fmaf((expf((r / (s * -3.0f))) / s), ((0.125f / r) / ((float) M_PI)), ((expf((-r / s)) / ((((float) M_PI) * s) * r)) * 0.125f));
}
function code(s, r) return fma(Float32(exp(Float32(r / Float32(s * Float32(-3.0)))) / s), Float32(Float32(Float32(0.125) / r) / Float32(pi)), Float32(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(Float32(pi) * s) * r)) * Float32(0.125))) end
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{e^{\frac{r}{s \cdot -3}}}{s}, \frac{\frac{0.125}{r}}{\pi}, \frac{e^{\frac{-r}{s}}}{\left(\pi \cdot s\right) \cdot r} \cdot 0.125\right)
\end{array}
Initial program 99.6%
Applied rewrites99.5%
Applied rewrites99.6%
(FPCore (s r) :precision binary32 (/ (fma (/ (exp (/ (- r) s)) (* PI r)) 0.125 (* (/ (exp (/ r (* s -3.0))) (* PI r)) 0.125)) s))
float code(float s, float r) {
return fmaf((expf((-r / s)) / (((float) M_PI) * r)), 0.125f, ((expf((r / (s * -3.0f))) / (((float) M_PI) * r)) * 0.125f)) / s;
}
function code(s, r) return Float32(fma(Float32(exp(Float32(Float32(-r) / s)) / Float32(Float32(pi) * r)), Float32(0.125), Float32(Float32(exp(Float32(r / Float32(s * Float32(-3.0)))) / Float32(Float32(pi) * r)) * Float32(0.125))) / s) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(\frac{e^{\frac{-r}{s}}}{\pi \cdot r}, 0.125, \frac{e^{\frac{r}{s \cdot -3}}}{\pi \cdot r} \cdot 0.125\right)}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
lower-/.f32N/A
Applied rewrites99.5%
lift-fma.f32N/A
*-commutativeN/A
lower-fma.f3299.5
Applied rewrites99.5%
(FPCore (s r) :precision binary32 (/ (* (/ (+ (exp (/ (- r) s)) (exp (/ r (* s -3.0)))) (* PI r)) 0.125) s))
float code(float s, float r) {
return (((expf((-r / s)) + expf((r / (s * -3.0f)))) / (((float) M_PI) * r)) * 0.125f) / s;
}
function code(s, r) return Float32(Float32(Float32(Float32(exp(Float32(Float32(-r) / s)) + exp(Float32(r / Float32(s * Float32(-3.0))))) / Float32(Float32(pi) * r)) * Float32(0.125)) / s) end
function tmp = code(s, r) tmp = (((exp((-r / s)) + exp((r / (s * single(-3.0))))) / (single(pi) * r)) * single(0.125)) / s; end
\begin{array}{l}
\\
\frac{\frac{e^{\frac{-r}{s}} + e^{\frac{r}{s \cdot -3}}}{\pi \cdot r} \cdot 0.125}{s}
\end{array}
Initial program 99.6%
Applied rewrites99.5%
Applied rewrites99.5%
(FPCore (s r) :precision binary32 (/ (/ 0.25 (log (pow (exp PI) r))) s))
float code(float s, float r) {
return (0.25f / logf(powf(expf(((float) M_PI)), r))) / s;
}
function code(s, r) return Float32(Float32(Float32(0.25) / log((exp(Float32(pi)) ^ r))) / s) end
function tmp = code(s, r) tmp = (single(0.25) / log((exp(single(pi)) ^ r))) / s; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\log \left({\left(e^{\pi}\right)}^{r}\right)}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
lower-/.f32N/A
Applied rewrites99.5%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f329.1
Applied rewrites9.1%
lift-*.f32N/A
lift-PI.f32N/A
add-log-expN/A
log-pow-revN/A
lower-log.f32N/A
lower-pow.f32N/A
lift-PI.f32N/A
lower-exp.f3242.7
Applied rewrites42.7%
(FPCore (s r) :precision binary32 (/ (fma 0.125 (/ (exp (* -1.0 (/ r s))) (* r PI)) (/ 0.125 (* r PI))) s))
float code(float s, float r) {
return fmaf(0.125f, (expf((-1.0f * (r / s))) / (r * ((float) M_PI))), (0.125f / (r * ((float) M_PI)))) / s;
}
function code(s, r) return Float32(fma(Float32(0.125), Float32(exp(Float32(Float32(-1.0) * Float32(r / s))) / Float32(r * Float32(pi))), Float32(Float32(0.125) / Float32(r * Float32(pi)))) / s) end
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(0.125, \frac{e^{-1 \cdot \frac{r}{s}}}{r \cdot \pi}, \frac{0.125}{r \cdot \pi}\right)}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
lower-/.f32N/A
Applied rewrites99.5%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f329.5
Applied rewrites9.5%
(FPCore (s r) :precision binary32 (/ (/ (fma -0.16666666666666666 (/ r (* s PI)) (* 0.25 (/ 1.0 PI))) r) s))
float code(float s, float r) {
return (fmaf(-0.16666666666666666f, (r / (s * ((float) M_PI))), (0.25f * (1.0f / ((float) M_PI)))) / r) / s;
}
function code(s, r) return Float32(Float32(fma(Float32(-0.16666666666666666), Float32(r / Float32(s * Float32(pi))), Float32(Float32(0.25) * Float32(Float32(1.0) / Float32(pi)))) / r) / s) end
\begin{array}{l}
\\
\frac{\frac{\mathsf{fma}\left(-0.16666666666666666, \frac{r}{s \cdot \pi}, 0.25 \cdot \frac{1}{\pi}\right)}{r}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around 0
lower-/.f32N/A
Applied rewrites99.5%
Taylor expanded in r around 0
lower-/.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-/.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (* (/ 1.0 s) (- (/ 0.25 (* PI r)) (/ 0.16666666666666666 (* PI s)))))
float code(float s, float r) {
return (1.0f / s) * ((0.25f / (((float) M_PI) * r)) - (0.16666666666666666f / (((float) M_PI) * s)));
}
function code(s, r) return Float32(Float32(Float32(1.0) / s) * Float32(Float32(Float32(0.25) / Float32(Float32(pi) * r)) - Float32(Float32(0.16666666666666666) / Float32(Float32(pi) * s)))) end
function tmp = code(s, r) tmp = (single(1.0) / s) * ((single(0.25) / (single(pi) * r)) - (single(0.16666666666666666) / (single(pi) * s))); end
\begin{array}{l}
\\
\frac{1}{s} \cdot \left(\frac{0.25}{\pi \cdot r} - \frac{0.16666666666666666}{\pi \cdot s}\right)
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower--.f32N/A
lower-*.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-/.f32N/A
mult-flipN/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f329.0
lift-*.f32N/A
lift-/.f32N/A
mult-flip-revN/A
lift-/.f329.0
lift-*.f32N/A
*-commutativeN/A
lower-*.f329.0
lift-*.f32N/A
lift-/.f32N/A
mult-flip-revN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (- (/ 0.25 (* PI r)) (/ 0.16666666666666666 (* PI s))) s))
float code(float s, float r) {
return ((0.25f / (((float) M_PI) * r)) - (0.16666666666666666f / (((float) M_PI) * s))) / s;
}
function code(s, r) return Float32(Float32(Float32(Float32(0.25) / Float32(Float32(pi) * r)) - Float32(Float32(0.16666666666666666) / Float32(Float32(pi) * s))) / s) end
function tmp = code(s, r) tmp = ((single(0.25) / (single(pi) * r)) - (single(0.16666666666666666) / (single(pi) * s))) / s; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi \cdot r} - \frac{0.16666666666666666}{\pi \cdot s}}{s}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower--.f32N/A
lower-*.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-/.f32N/A
lower-*.f32N/A
lower-PI.f329.0
Applied rewrites9.0%
lift-*.f32N/A
lift-/.f32N/A
mult-flip-revN/A
lift-/.f329.0
lift-*.f32N/A
*-commutativeN/A
lower-*.f329.0
lift-*.f32N/A
lift-/.f32N/A
mult-flip-revN/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
lower-/.f329.0
Applied rewrites9.0%
(FPCore (s r) :precision binary32 (/ (/ 0.25 (* PI s)) r))
float code(float s, float r) {
return (0.25f / (((float) M_PI) * s)) / r;
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(Float32(pi) * s)) / r) end
function tmp = code(s, r) tmp = (single(0.25) / (single(pi) * s)) / r; end
\begin{array}{l}
\\
\frac{\frac{0.25}{\pi \cdot s}}{r}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.1
Applied rewrites9.1%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
*-commutativeN/A
associate-/r*N/A
lower-/.f32N/A
lower-/.f329.1
Applied rewrites9.1%
(FPCore (s r) :precision binary32 (/ (/ 0.25 (* s r)) PI))
float code(float s, float r) {
return (0.25f / (s * r)) / ((float) M_PI);
}
function code(s, r) return Float32(Float32(Float32(0.25) / Float32(s * r)) / Float32(pi)) end
function tmp = code(s, r) tmp = (single(0.25) / (s * r)) / single(pi); end
\begin{array}{l}
\\
\frac{\frac{0.25}{s \cdot r}}{\pi}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.1
Applied rewrites9.1%
lift-/.f32N/A
lift-*.f32N/A
lift-*.f32N/A
associate-*r*N/A
associate-/r*N/A
*-commutativeN/A
lower-/.f32N/A
lower-/.f32N/A
lower-*.f329.1
Applied rewrites9.1%
(FPCore (s r) :precision binary32 (/ 0.25 (* r (* s PI))))
float code(float s, float r) {
return 0.25f / (r * (s * ((float) M_PI)));
}
function code(s, r) return Float32(Float32(0.25) / Float32(r * Float32(s * Float32(pi)))) end
function tmp = code(s, r) tmp = single(0.25) / (r * (s * single(pi))); end
\begin{array}{l}
\\
\frac{0.25}{r \cdot \left(s \cdot \pi\right)}
\end{array}
Initial program 99.6%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lower-PI.f329.1
Applied rewrites9.1%
herbie shell --seed 2025142
(FPCore (s r)
:name "Disney BSSRDF, PDF of scattering profile"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (< 1e-6 r) (< r 1000000.0)))
(+ (/ (* 0.25 (exp (/ (- r) s))) (* (* (* 2.0 PI) s) r)) (/ (* 0.75 (exp (/ (- r) (* 3.0 s)))) (* (* (* 6.0 PI) s) r))))