
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
! Evaluates (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)).
! s and u are real(4) inputs; the result is real(4).
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res

    ! Name the inner quotient; the operation order matches the one-line formula.
    associate (shifted => (u - 0.25e0) / 0.75e0)
        res = (3.0e0 * s) * log(1.0e0 / (1.0e0 - shifted))
    end associate
end function code
# Evaluates (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)).
# Every intermediate is converted to Float32, as in the one-line form.
function code(s, u)
    scale = Float32(Float32(3.0) * s)
    shifted = Float32(Float32(u - Float32(0.25)) / Float32(0.75))
    reciprocal = Float32(Float32(1.0) / Float32(Float32(1.0) - shifted))
    return Float32(scale * log(reciprocal))
end
function val = code(s, u)
    % CODE  Evaluates (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)).
    % All literal constants are single precision.
    scale = single(3.0) * s;
    shifted = (u - single(0.25)) / single(0.75);
    val = scale * log(single(1.0) / (single(1.0) - shifted));
end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
! Returns (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)) as a real(4) value.
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res

    ! log_arg is the reciprocal that is passed to the logarithm.
    associate (log_arg => 1.0e0 / (1.0e0 - ((u - 0.25e0) / 0.75e0)))
        res = (3.0e0 * s) * log(log_arg)
    end associate
end function code
# Returns (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)) as a Float32.
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    fraction = Float32(Float32(u - Float32(0.25)) / Float32(0.75))
    log_arg = Float32(Float32(1.0) / Float32(Float32(1.0) - fraction))
    return Float32(Float32(Float32(3.0) * s) * log(log_arg))
end
function val = code(s, u)
    % CODE  Returns (3 * s) * log(1 / (1 - (u - 0.25) / 0.75)).
    % The logarithm argument is formed first, then scaled by 3 * s.
    fraction = (u - single(0.25)) / single(0.75);
    log_arg = single(1.0) / (single(1.0) - fraction);
    val = (single(3.0) * s) * log(log_arg);
end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
(FPCore (s u) :precision binary32 (* (* s -3.0) (log1p (/ (+ u -0.25) -0.75))))
float code(float s, float u) {
return (s * -3.0f) * log1pf(((u + -0.25f) / -0.75f));
}
# Returns (s * -3) * log1p((u + -0.25) / -0.75) as a Float32.
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    scale = Float32(s * Float32(-3.0))
    ratio = Float32(Float32(u + Float32(-0.25)) / Float32(-0.75))
    return Float32(scale * log1p(ratio))
end
\begin{array}{l}
\\
\left(s \cdot -3\right) \cdot \mathsf{log1p}\left(\frac{u + -0.25}{-0.75}\right)
\end{array}
Initial program: 95.3%
log-rec: 96.4%
distribute-rgt-neg-out: 96.4%
distribute-lft-neg-out: 96.4%
*-commutative: 96.4%
distribute-rgt-neg-in: 96.4%
metadata-eval: 96.4%
sub-neg: 96.4%
log1p-define: 98.4%
distribute-neg-frac2: 98.4%
sub-neg: 98.4%
metadata-eval: 98.4%
metadata-eval: 98.4%
Simplified: 98.4%
(FPCore (s u) :precision binary32 (* (* s -3.0) (log1p (* (+ u -0.25) -1.3333333333333333))))
float code(float s, float u) {
return (s * -3.0f) * log1pf(((u + -0.25f) * -1.3333333333333333f));
}
# Returns (s * -3) * log1p((u + -0.25) * -1.3333333333333333) as a Float32.
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    scale = Float32(s * Float32(-3.0))
    product = Float32(Float32(u + Float32(-0.25)) * Float32(-1.3333333333333333))
    return Float32(scale * log1p(product))
end
\begin{array}{l}
\\
\left(s \cdot -3\right) \cdot \mathsf{log1p}\left(\left(u + -0.25\right) \cdot -1.3333333333333333\right)
\end{array}
Initial program: 95.3%
log-rec: 96.4%
distribute-rgt-neg-out: 96.4%
distribute-lft-neg-out: 96.4%
*-commutative: 96.4%
distribute-rgt-neg-in: 96.4%
metadata-eval: 96.4%
sub-neg: 96.4%
log1p-define: 98.4%
neg-sub0: 98.4%
div-sub: 96.3%
associate--r-: 96.3%
neg-sub0: 96.3%
neg-mul-1: 96.3%
associate-/l*: 96.3%
*-commutative: 96.3%
associate-/l*: 96.7%
fma-define: 98.0%
metadata-eval: 98.0%
metadata-eval: 98.0%
Simplified: 98.0%
fma-undefine: 96.7%
metadata-eval: 96.7%
metadata-eval: 96.7%
distribute-rgt-in: 98.0%
sub-neg: 98.0%
metadata-eval: 98.0%
distribute-lft-neg-in: 98.0%
*-commutative: 98.0%
distribute-rgt-neg-in: 98.0%
sub-neg: 98.0%
metadata-eval: 98.0%
metadata-eval: 98.0%
Applied egg-rr: 98.0%
(FPCore (s u) :precision binary32 (* -3.0 (* s (log (- 1.3333333333333333 (* u 1.3333333333333333))))))
float code(float s, float u) {
return -3.0f * (s * logf((1.3333333333333333f - (u * 1.3333333333333333f))));
}
! Returns -3 * (s * log(c - u * c)) with c = 1.3333333333333333e0.
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res
    ! Default-real constant, the same literal the one-line formula uses twice.
    real, parameter :: four_thirds = 1.3333333333333333e0

    res = (-3.0e0) * (s * log(four_thirds - (u * four_thirds)))
end function code
# Returns -3 * (s * log(c - u * c)) with c = Float32(1.3333333333333333).
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    four_thirds = Float32(1.3333333333333333)
    log_arg = Float32(four_thirds - Float32(u * four_thirds))
    return Float32(Float32(-3.0) * Float32(s * log(log_arg)))
end
function val = code(s, u)
    % CODE  Returns -3 * (s * log(c - u * c)) with c = single(1.3333333333333333).
    four_thirds = single(1.3333333333333333);
    log_arg = four_thirds - (u * four_thirds);
    val = single(-3.0) * (s * log(log_arg));
end
\begin{array}{l}
\\
-3 \cdot \left(s \cdot \log \left(1.3333333333333333 - u \cdot 1.3333333333333333\right)\right)
\end{array}
Initial program: 95.3%
associate-*l*: 95.3%
log-rec: 96.4%
div-sub: 95.4%
metadata-eval: 95.4%
Simplified: 95.4%
Taylor expanded in s around 0: 95.8%
Final simplification: 95.8%
(FPCore (s u) :precision binary32 (* (* s 3.0) (+ u (log 0.75))))
/*
 * Returns (s * 3) * (u + log(0.75)), computed in float.
 */
float code(float s, float u) {
    const float scale = s * 3.0f;
    const float offset = u + logf(0.75f);
    return scale * offset;
}
! Returns (s * 3) * (u + log(0.75)).
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res

    ! offset is u shifted by the constant log(0.75).
    associate (offset => u + log(0.75e0))
        res = (s * 3.0e0) * offset
    end associate
end function code
# Returns (s * 3) * (u + log(0.75)) as a Float32.
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    scale = Float32(s * Float32(3.0))
    offset = Float32(u + log(Float32(0.75)))
    return Float32(scale * offset)
end
function val = code(s, u)
    % CODE  Returns (s * 3) * (u + log(0.75)) using single-precision constants.
    scale = s * single(3.0);
    offset = u + log(single(0.75));
    val = scale * offset;
end
\begin{array}{l}
\\
\left(s \cdot 3\right) \cdot \left(u + \log 0.75\right)
\end{array}
Initial program: 95.3%
Taylor expanded in u around 0: 25.1%
associate-*r*: 25.1%
associate-*r*: 25.1%
distribute-lft-out: 25.1%
*-commutative: 25.1%
Simplified: 25.1%
(FPCore (s u) :precision binary32 (* 3.0 (* s (+ u (log 0.75)))))
/*
 * Returns 3 * (s * (u + log(0.75))), computed in float.
 */
float code(float s, float u) {
    const float offset = u + logf(0.75f);
    const float scaled = s * offset;
    return 3.0f * scaled;
}
! Returns 3 * (s * (u + log(0.75))).
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res

    ! offset is u shifted by the constant log(0.75).
    associate (offset => u + log(0.75e0))
        res = 3.0e0 * (s * offset)
    end associate
end function code
# Returns 3 * (s * (u + log(0.75))) as a Float32.
# Each arithmetic step is wrapped in Float32, as in the one-line form.
function code(s, u)
    offset = Float32(u + log(Float32(0.75)))
    scaled = Float32(s * offset)
    return Float32(Float32(3.0) * scaled)
end
function val = code(s, u)
    % CODE  Returns 3 * (s * (u + log(0.75))) using single-precision constants.
    offset = u + log(single(0.75));
    scaled = s * offset;
    val = single(3.0) * scaled;
end
\begin{array}{l}
\\
3 \cdot \left(s \cdot \left(u + \log 0.75\right)\right)
\end{array}
Initial program: 95.3%
Taylor expanded in s around 0: 95.3%
Taylor expanded in u around 0: 25.1%
(FPCore (s u) :precision binary32 0.0)
/*
 * Constant alternative: returns 0.0f whatever the arguments are.
 */
float code(float s, float u) {
    /* Neither argument takes part in the result. */
    (void)s;
    (void)u;
    return 0.0f;
}
! Constant alternative: returns zero whatever the arguments are.
function code(s, u) result(res)
    implicit none
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    real(4) :: res

    ! s and u are accepted but do not take part in the result.
    res = 0.0e0
end function code
# Constant alternative: returns Float32 zero whatever the arguments are.
function code(s, u)
    result = Float32(0.0)
    return result
end
function val = code(s, u)
    % CODE  Constant alternative: returns single-precision zero.
    % s and u are accepted but do not take part in the result.
    val = single(0.0);
end
\begin{array}{l}
\\
0
\end{array}
Initial program: 95.3%
associate-*l*: 95.3%
log-rec: 96.4%
div-sub: 95.4%
metadata-eval: 95.4%
Simplified: 95.4%
Applied egg-rr: 6.4%
*-inverses: 11.0%
Simplified: 11.0%
Taylor expanded in s around 0: 11.0%
herbie shell --seed 2024131
(FPCore (s u)
:name "Disney BSSRDF, sample scattering profile, upper"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (<= 0.25 u) (<= u 1.0)))
(* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))