
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (3.0e0 * s) * log((1.0e0 / (1.0e0 - ((u - 0.25e0) / 0.75e0))))
end function
function code(s, u) return Float32(Float32(Float32(3.0) * s) * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(u - Float32(0.25)) / Float32(0.75)))))) end
function tmp = code(s, u) tmp = (single(3.0) * s) * log((single(1.0) / (single(1.0) - ((u - single(0.25)) / single(0.75))))); end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (3.0e0 * s) * log((1.0e0 / (1.0e0 - ((u - 0.25e0) / 0.75e0))))
end function
function code(s, u) return Float32(Float32(Float32(3.0) * s) * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(u - Float32(0.25)) / Float32(0.75)))))) end
function tmp = code(s, u) tmp = (single(3.0) * s) * log((single(1.0) / (single(1.0) - ((u - single(0.25)) / single(0.75))))); end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
(FPCore (s u)
:precision binary32
(fma
(* 3.0 (log1p (* (+ u -0.25) (fma u 1.7777777777777777 0.8888888888888888))))
s
(*
(log1p
(*
(+ u -0.25)
(fma
u
(fma u -2.3703703703703702 1.1851851851851851)
-0.14814814814814814)))
(* 3.0 (- s)))))
float code(float s, float u) {
return fmaf((3.0f * log1pf(((u + -0.25f) * fmaf(u, 1.7777777777777777f, 0.8888888888888888f)))), s, (log1pf(((u + -0.25f) * fmaf(u, fmaf(u, -2.3703703703703702f, 1.1851851851851851f), -0.14814814814814814f))) * (3.0f * -s)));
}
function code(s, u) return fma(Float32(Float32(3.0) * log1p(Float32(Float32(u + Float32(-0.25)) * fma(u, Float32(1.7777777777777777), Float32(0.8888888888888888))))), s, Float32(log1p(Float32(Float32(u + Float32(-0.25)) * fma(u, fma(u, Float32(-2.3703703703703702), Float32(1.1851851851851851)), Float32(-0.14814814814814814)))) * Float32(Float32(3.0) * Float32(-s)))) end
\begin{array}{l}
\\
\mathsf{fma}\left(3 \cdot \mathsf{log1p}\left(\left(u + -0.25\right) \cdot \mathsf{fma}\left(u, 1.7777777777777777, 0.8888888888888888\right)\right), s, \mathsf{log1p}\left(\left(u + -0.25\right) \cdot \mathsf{fma}\left(u, \mathsf{fma}\left(u, -2.3703703703703702, 1.1851851851851851\right), -0.14814814814814814\right)\right) \cdot \left(3 \cdot \left(-s\right)\right)\right)
\end{array}
Initial program 95.8%
Applied egg-rr98.2%
Applied egg-rr98.5%
Applied egg-rr98.6%
Taylor expanded in u around 0
sub-negN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
metadata-eval98.6
Simplified98.6%
Final simplification98.6%
(FPCore (s u)
:precision binary32
(*
(* 3.0 s)
(-
(log1p
(fma
(* u (+ u -0.25))
1.7777777777777777
(fma u 0.8888888888888888 -0.2222222222222222)))
(log1p
(*
(fma u -2.3703703703703702 0.5925925925925926)
(* (+ u -0.25) (+ u -0.25)))))))
float code(float s, float u) {
return (3.0f * s) * (log1pf(fmaf((u * (u + -0.25f)), 1.7777777777777777f, fmaf(u, 0.8888888888888888f, -0.2222222222222222f))) - log1pf((fmaf(u, -2.3703703703703702f, 0.5925925925925926f) * ((u + -0.25f) * (u + -0.25f)))));
}
function code(s, u) return Float32(Float32(Float32(3.0) * s) * Float32(log1p(fma(Float32(u * Float32(u + Float32(-0.25))), Float32(1.7777777777777777), fma(u, Float32(0.8888888888888888), Float32(-0.2222222222222222)))) - log1p(Float32(fma(u, Float32(-2.3703703703703702), Float32(0.5925925925925926)) * Float32(Float32(u + Float32(-0.25)) * Float32(u + Float32(-0.25))))))) end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \left(\mathsf{log1p}\left(\mathsf{fma}\left(u \cdot \left(u + -0.25\right), 1.7777777777777777, \mathsf{fma}\left(u, 0.8888888888888888, -0.2222222222222222\right)\right)\right) - \mathsf{log1p}\left(\mathsf{fma}\left(u, -2.3703703703703702, 0.5925925925925926\right) \cdot \left(\left(u + -0.25\right) \cdot \left(u + -0.25\right)\right)\right)\right)
\end{array}
Initial program 95.8%
Applied egg-rr98.2%
distribute-lft-inN/A
associate-+l+N/A
*-commutativeN/A
lower-+.f32N/A
*-commutativeN/A
lower-*.f32N/A
metadata-evalN/A
metadata-eval98.3
Applied egg-rr98.3%
lift-+.f32N/A
lift-+.f32N/A
lift-+.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f3298.3
lift-*.f32N/A
*-commutativeN/A
lift-+.f32N/A
distribute-rgt-inN/A
metadata-evalN/A
metadata-evalN/A
lower-fma.f32N/A
metadata-eval98.3
Applied egg-rr98.3%
lift-+.f32N/A
lift-*.f32N/A
distribute-lft-inN/A
lift-*.f32N/A
*-commutativeN/A
associate-*r*N/A
*-commutativeN/A
lower-fma.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-+.f32N/A
distribute-rgt-inN/A
metadata-evalN/A
metadata-evalN/A
lower-fma.f32N/A
metadata-eval98.5
Applied egg-rr98.5%
(FPCore (s u)
:precision binary32
(*
(* 3.0 s)
(-
(log1p (* (+ u -0.25) (fma u 1.7777777777777777 0.8888888888888888)))
(log1p
(*
(fma u -2.3703703703703702 0.5925925925925926)
(* (+ u -0.25) (+ u -0.25)))))))
float code(float s, float u) {
return (3.0f * s) * (log1pf(((u + -0.25f) * fmaf(u, 1.7777777777777777f, 0.8888888888888888f))) - log1pf((fmaf(u, -2.3703703703703702f, 0.5925925925925926f) * ((u + -0.25f) * (u + -0.25f)))));
}
function code(s, u) return Float32(Float32(Float32(3.0) * s) * Float32(log1p(Float32(Float32(u + Float32(-0.25)) * fma(u, Float32(1.7777777777777777), Float32(0.8888888888888888)))) - log1p(Float32(fma(u, Float32(-2.3703703703703702), Float32(0.5925925925925926)) * Float32(Float32(u + Float32(-0.25)) * Float32(u + Float32(-0.25))))))) end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \left(\mathsf{log1p}\left(\left(u + -0.25\right) \cdot \mathsf{fma}\left(u, 1.7777777777777777, 0.8888888888888888\right)\right) - \mathsf{log1p}\left(\mathsf{fma}\left(u, -2.3703703703703702, 0.5925925925925926\right) \cdot \left(\left(u + -0.25\right) \cdot \left(u + -0.25\right)\right)\right)\right)
\end{array}
Initial program 95.8%
Applied egg-rr98.2%
distribute-lft-inN/A
associate-+l+N/A
*-commutativeN/A
lower-+.f32N/A
*-commutativeN/A
lower-*.f32N/A
metadata-evalN/A
metadata-eval98.3
Applied egg-rr98.3%
lift-+.f32N/A
lift-+.f32N/A
lift-+.f32N/A
lift-*.f32N/A
lift-*.f32N/A
*-commutativeN/A
lift-*.f32N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f32N/A
lower-*.f3298.3
lift-*.f32N/A
*-commutativeN/A
lift-+.f32N/A
distribute-rgt-inN/A
metadata-evalN/A
metadata-evalN/A
lower-fma.f32N/A
metadata-eval98.3
Applied egg-rr98.3%
lift-+.f32N/A
*-commutativeN/A
+-commutativeN/A
+-commutativeN/A
lift-fma.f32N/A
*-commutativeN/A
lower-*.f3298.4
Applied egg-rr98.4%
Final simplification98.4%
(FPCore (s u) :precision binary32 (* (* 3.0 s) (- (log1p (fma u 1.3333333333333333 -0.3333333333333333)) (log1p (* (- 0.25 u) (* (+ u -0.25) 1.7777777777777777))))))
float code(float s, float u) {
return (3.0f * s) * (log1pf(fmaf(u, 1.3333333333333333f, -0.3333333333333333f)) - log1pf(((0.25f - u) * ((u + -0.25f) * 1.7777777777777777f))));
}
function code(s, u) return Float32(Float32(Float32(3.0) * s) * Float32(log1p(fma(u, Float32(1.3333333333333333), Float32(-0.3333333333333333))) - log1p(Float32(Float32(Float32(0.25) - u) * Float32(Float32(u + Float32(-0.25)) * Float32(1.7777777777777777)))))) end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \left(\mathsf{log1p}\left(\mathsf{fma}\left(u, 1.3333333333333333, -0.3333333333333333\right)\right) - \mathsf{log1p}\left(\left(0.25 - u\right) \cdot \left(\left(u + -0.25\right) \cdot 1.7777777777777777\right)\right)\right)
\end{array}
Initial program 95.8%
Applied egg-rr98.2%
Final simplification98.2%
(FPCore (s u) :precision binary32 (* 3.0 (* (- s) (log1p (- (fma u 1.3333333333333333 -0.3333333333333333))))))
float code(float s, float u) {
return 3.0f * (-s * log1pf(-fmaf(u, 1.3333333333333333f, -0.3333333333333333f)));
}
function code(s, u) return Float32(Float32(3.0) * Float32(Float32(-s) * log1p(Float32(-fma(u, Float32(1.3333333333333333), Float32(-0.3333333333333333)))))) end
\begin{array}{l}
\\
3 \cdot \left(\left(-s\right) \cdot \mathsf{log1p}\left(-\mathsf{fma}\left(u, 1.3333333333333333, -0.3333333333333333\right)\right)\right)
\end{array}
Initial program 95.8%
lift--.f32N/A
lift-/.f32N/A
lift--.f32N/A
/-rgt-identityN/A
clear-numN/A
lift-/.f32N/A
lift-log.f32N/A
associate-*l*N/A
*-commutativeN/A
lower-*.f32N/A
Applied egg-rr98.0%
Final simplification98.0%
(FPCore (s u) :precision binary32 (* (* s -3.0) (log1p (fma -1.3333333333333333 u 0.3333333333333333))))
float code(float s, float u) {
return (s * -3.0f) * log1pf(fmaf(-1.3333333333333333f, u, 0.3333333333333333f));
}
function code(s, u) return Float32(Float32(s * Float32(-3.0)) * log1p(fma(Float32(-1.3333333333333333), u, Float32(0.3333333333333333)))) end
\begin{array}{l}
\\
\left(s \cdot -3\right) \cdot \mathsf{log1p}\left(\mathsf{fma}\left(-1.3333333333333333, u, 0.3333333333333333\right)\right)
\end{array}
Initial program 95.8%
Taylor expanded in s around 0
associate-*r*N/A
log-recN/A
distribute-rgt-neg-outN/A
distribute-lft-neg-inN/A
distribute-lft-neg-inN/A
metadata-evalN/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
sub-negN/A
lower-log1p.f32N/A
distribute-lft-neg-inN/A
metadata-evalN/A
sub-negN/A
distribute-lft-inN/A
metadata-evalN/A
metadata-evalN/A
lower-fma.f3297.9
Simplified97.9%
(FPCore (s u) :precision binary32 (* (* s -3.0) (log (fma u -1.3333333333333333 1.3333333333333333))))
float code(float s, float u) {
return (s * -3.0f) * logf(fmaf(u, -1.3333333333333333f, 1.3333333333333333f));
}
function code(s, u) return Float32(Float32(s * Float32(-3.0)) * log(fma(u, Float32(-1.3333333333333333), Float32(1.3333333333333333)))) end
\begin{array}{l}
\\
\left(s \cdot -3\right) \cdot \log \left(\mathsf{fma}\left(u, -1.3333333333333333, 1.3333333333333333\right)\right)
\end{array}
Initial program 95.8%
Taylor expanded in u around 0
+-commutativeN/A
lower-fma.f3295.9
Simplified95.9%
lift-*.f32N/A
lift-fma.f32N/A
lift-/.f32N/A
lift-log.f32N/A
*-commutativeN/A
lift-*.f32N/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f3295.9
lift-log.f32N/A
lift-/.f32N/A
log-recN/A
lower-neg.f32N/A
lower-log.f3296.7
lift-fma.f32N/A
*-commutativeN/A
lower-fma.f3296.7
Applied egg-rr96.7%
Taylor expanded in s around 0
associate-*r*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-log.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f3296.7
Simplified96.7%
(FPCore (s u) :precision binary32 (* (* 3.0 s) (+ u (log 0.75))))
float code(float s, float u) {
return (3.0f * s) * (u + logf(0.75f));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (3.0e0 * s) * (u + log(0.75e0))
end function
function code(s, u) return Float32(Float32(Float32(3.0) * s) * Float32(u + log(Float32(0.75)))) end
function tmp = code(s, u) tmp = (single(3.0) * s) * (u + log(single(0.75))); end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \left(u + \log 0.75\right)
\end{array}
Initial program 95.8%
Taylor expanded in u around 0
associate-*r*N/A
associate-*r*N/A
distribute-lft-outN/A
*-commutativeN/A
lower-*.f32N/A
lower-+.f32N/A
lower-log.f32N/A
lower-*.f3225.8
Simplified25.8%
Final simplification25.8%
(FPCore (s u) :precision binary32 (* 3.0 (* s (+ u (log 0.75)))))
float code(float s, float u) {
return 3.0f * (s * (u + logf(0.75f)));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = 3.0e0 * (s * (u + log(0.75e0)))
end function
function code(s, u) return Float32(Float32(3.0) * Float32(s * Float32(u + log(Float32(0.75))))) end
function tmp = code(s, u) tmp = single(3.0) * (s * (u + log(single(0.75)))); end
\begin{array}{l}
\\
3 \cdot \left(s \cdot \left(u + \log 0.75\right)\right)
\end{array}
Initial program 95.8%
Taylor expanded in u around 0
+-commutativeN/A
lower-fma.f3295.9
Simplified95.9%
Taylor expanded in u around 0
distribute-lft-outN/A
lower-*.f32N/A
distribute-lft-outN/A
lower-*.f32N/A
lower-+.f32N/A
lower-log.f3225.8
Simplified25.8%
(FPCore (s u) :precision binary32 (* s (log 1.3333333333333333)))
float code(float s, float u) {
return s * logf(1.3333333333333333f);
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = s * log(1.3333333333333333e0)
end function
function code(s, u) return Float32(s * log(Float32(1.3333333333333333))) end
function tmp = code(s, u) tmp = s * log(single(1.3333333333333333)); end
\begin{array}{l}
\\
s \cdot \log 1.3333333333333333
\end{array}
Initial program 95.8%
Taylor expanded in u around 0
lower-log.f327.2
Simplified7.2%
Taylor expanded in s around -inf
mul-1-negN/A
lower-neg.f3225.5
Simplified25.5%
lift-log.f32N/A
distribute-lft-neg-outN/A
distribute-rgt-neg-inN/A
lower-*.f32N/A
lift-log.f32N/A
neg-logN/A
metadata-evalN/A
lower-log.f3225.5
Applied egg-rr25.5%
herbie shell --seed 2024214
(FPCore (s u)
:name "Disney BSSRDF, sample scattering profile, upper"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (<= 0.25 u) (<= u 1.0)))
(* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))