
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (3.0e0 * s) * log((1.0e0 / (1.0e0 - ((u - 0.25e0) / 0.75e0))))
end function
function code(s, u) return Float32(Float32(Float32(3.0) * s) * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(u - Float32(0.25)) / Float32(0.75)))))) end
function tmp = code(s, u) tmp = (single(3.0) * s) * log((single(1.0) / (single(1.0) - ((u - single(0.25)) / single(0.75))))); end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (s u) :precision binary32 (* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))
float code(float s, float u) {
return (3.0f * s) * logf((1.0f / (1.0f - ((u - 0.25f) / 0.75f))));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (3.0e0 * s) * log((1.0e0 / (1.0e0 - ((u - 0.25e0) / 0.75e0))))
end function
function code(s, u) return Float32(Float32(Float32(3.0) * s) * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(u - Float32(0.25)) / Float32(0.75)))))) end
function tmp = code(s, u) tmp = (single(3.0) * s) * log((single(1.0) / (single(1.0) - ((u - single(0.25)) / single(0.75))))); end
\begin{array}{l}
\\
\left(3 \cdot s\right) \cdot \log \left(\frac{1}{1 - \frac{u - 0.25}{0.75}}\right)
\end{array}
(FPCore (s u) :precision binary32 (* s (sqrt (* (pow (log1p (fma u -1.3333333333333333 0.3333333333333333)) 2.0) 9.0))))
float code(float s, float u) {
return s * sqrtf((powf(log1pf(fmaf(u, -1.3333333333333333f, 0.3333333333333333f)), 2.0f) * 9.0f));
}
function code(s, u) return Float32(s * sqrt(Float32((log1p(fma(u, Float32(-1.3333333333333333), Float32(0.3333333333333333))) ^ Float32(2.0)) * Float32(9.0)))) end
\begin{array}{l}
\\
s \cdot \sqrt{{\left(\mathsf{log1p}\left(\mathsf{fma}\left(u, -1.3333333333333333, 0.3333333333333333\right)\right)\right)}^{2} \cdot 9}
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
add-sqr-sqrt97.6%
sqrt-unprod98.0%
swap-sqr98.1%
pow298.1%
metadata-eval98.1%
Applied egg-rr98.1%
(FPCore (s u) :precision binary32 (* s (* (log1p (fma u -1.3333333333333333 0.3333333333333333)) -3.0)))
float code(float s, float u) {
return s * (log1pf(fmaf(u, -1.3333333333333333f, 0.3333333333333333f)) * -3.0f);
}
function code(s, u) return Float32(s * Float32(log1p(fma(u, Float32(-1.3333333333333333), Float32(0.3333333333333333))) * Float32(-3.0))) end
\begin{array}{l}
\\
s \cdot \left(\mathsf{log1p}\left(\mathsf{fma}\left(u, -1.3333333333333333, 0.3333333333333333\right)\right) \cdot -3\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
(FPCore (s u) :precision binary32 (* s (* -3.0 (log1p (* u (- (* 0.3333333333333333 (/ 1.0 u)) 1.3333333333333333))))))
float code(float s, float u) {
return s * (-3.0f * log1pf((u * ((0.3333333333333333f * (1.0f / u)) - 1.3333333333333333f))));
}
function code(s, u) return Float32(s * Float32(Float32(-3.0) * log1p(Float32(u * Float32(Float32(Float32(0.3333333333333333) * Float32(Float32(1.0) / u)) - Float32(1.3333333333333333)))))) end
\begin{array}{l}
\\
s \cdot \left(-3 \cdot \mathsf{log1p}\left(u \cdot \left(0.3333333333333333 \cdot \frac{1}{u} - 1.3333333333333333\right)\right)\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
Taylor expanded in u around inf 97.2%
Final simplification97.2%
(FPCore (s u) :precision binary32 (* s (* -3.0 (log1p (* u (+ -1.3333333333333333 (/ 0.3333333333333333 u)))))))
float code(float s, float u) {
return s * (-3.0f * log1pf((u * (-1.3333333333333333f + (0.3333333333333333f / u)))));
}
function code(s, u) return Float32(s * Float32(Float32(-3.0) * log1p(Float32(u * Float32(Float32(-1.3333333333333333) + Float32(Float32(0.3333333333333333) / u)))))) end
\begin{array}{l}
\\
s \cdot \left(-3 \cdot \mathsf{log1p}\left(u \cdot \left(-1.3333333333333333 + \frac{0.3333333333333333}{u}\right)\right)\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
Taylor expanded in u around inf 97.2%
sub-neg97.2%
metadata-eval97.2%
+-commutative97.2%
associate-*r/97.2%
metadata-eval97.2%
Simplified97.2%
Final simplification97.2%
(FPCore (s u) :precision binary32 (* s (* -3.0 (log1p (+ 0.3333333333333333 (* u -1.3333333333333333))))))
float code(float s, float u) {
return s * (-3.0f * log1pf((0.3333333333333333f + (u * -1.3333333333333333f))));
}
function code(s, u) return Float32(s * Float32(Float32(-3.0) * log1p(Float32(Float32(0.3333333333333333) + Float32(u * Float32(-1.3333333333333333)))))) end
\begin{array}{l}
\\
s \cdot \left(-3 \cdot \mathsf{log1p}\left(0.3333333333333333 + u \cdot -1.3333333333333333\right)\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
fma-undefine97.0%
Applied egg-rr97.0%
Final simplification97.0%
(FPCore (s u) :precision binary32 (* -3.0 (* s (log (+ 1.3333333333333333 (* u -1.3333333333333333))))))
float code(float s, float u) {
return -3.0f * (s * logf((1.3333333333333333f + (u * -1.3333333333333333f))));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = (-3.0e0) * (s * log((1.3333333333333333e0 + (u * (-1.3333333333333333e0)))))
end function
function code(s, u) return Float32(Float32(-3.0) * Float32(s * log(Float32(Float32(1.3333333333333333) + Float32(u * Float32(-1.3333333333333333)))))) end
function tmp = code(s, u) tmp = single(-3.0) * (s * log((single(1.3333333333333333) + (u * single(-1.3333333333333333))))); end
\begin{array}{l}
\\
-3 \cdot \left(s \cdot \log \left(1.3333333333333333 + u \cdot -1.3333333333333333\right)\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
Taylor expanded in s around 0 96.1%
Final simplification96.1%
(FPCore (s u) :precision binary32 (* 3.0 (* s (log 1.3333333333333333))))
float code(float s, float u) {
return 3.0f * (s * logf(1.3333333333333333f));
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = 3.0e0 * (s * log(1.3333333333333333e0))
end function
function code(s, u) return Float32(Float32(3.0) * Float32(s * log(Float32(1.3333333333333333)))) end
function tmp = code(s, u) tmp = single(3.0) * (s * log(single(1.3333333333333333))); end
\begin{array}{l}
\\
3 \cdot \left(s \cdot \log 1.3333333333333333\right)
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
add-sqr-sqrt97.6%
sqrt-unprod98.0%
swap-sqr98.1%
pow298.1%
metadata-eval98.1%
Applied egg-rr98.1%
Taylor expanded in u around 0 27.9%
(FPCore (s u) :precision binary32 (* s (log 0.421875)))
float code(float s, float u) {
return s * logf(0.421875f);
}
real(4) function code(s, u)
real(4), intent (in) :: s
real(4), intent (in) :: u
code = s * log(0.421875e0)
end function
function code(s, u) return Float32(s * log(Float32(0.421875))) end
function tmp = code(s, u) tmp = s * log(single(0.421875)); end
\begin{array}{l}
\\
s \cdot \log 0.421875
\end{array}
Initial program 95.8%
*-commutative95.8%
associate-*l*95.9%
*-commutative95.9%
log-rec96.8%
distribute-lft-neg-out96.8%
distribute-rgt-neg-in96.8%
sub-neg96.8%
log1p-define98.4%
neg-sub098.4%
div-sub96.6%
associate--r-96.6%
neg-sub096.6%
distribute-frac-neg96.6%
neg-mul-196.6%
*-commutative96.6%
associate-/l*97.0%
fma-define98.0%
metadata-eval98.0%
metadata-eval98.0%
metadata-eval98.0%
Simplified98.0%
Taylor expanded in s around 0 96.1%
Simplified96.9%
Taylor expanded in u around 0 7.3%
herbie shell --seed 2024096
(FPCore (s u)
:name "Disney BSSRDF, sample scattering profile, upper"
:precision binary32
:pre (and (and (<= 0.0 s) (<= s 256.0)) (and (<= 0.25 u) (<= u 1.0)))
(* (* 3.0 s) (log (/ 1.0 (- 1.0 (/ (- u 0.25) 0.75))))))