
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(*
s
(-
(log
(+
(/
1.0
(+
(/ u (+ 1.0 (exp (/ (- PI) s))))
(/ (- 1.0 u) (+ 1.0 (exp (/ PI s))))))
-1.0)))))
float code(float u, float s) {
return s * -logf(((1.0f / ((u / (1.0f + expf((-((float) M_PI) / s)))) + ((1.0f - u) / (1.0f + expf((((float) M_PI) / s)))))) + -1.0f));
}
function code(u, s) return Float32(s * Float32(-log(Float32(Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) + Float32(Float32(Float32(1.0) - u) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))))) + Float32(-1.0))))) end
function tmp = code(u, s) tmp = s * -log(((single(1.0) / ((u / (single(1.0) + exp((-single(pi) / s)))) + ((single(1.0) - u) / (single(1.0) + exp((single(pi) / s)))))) + single(-1.0))); end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\frac{1}{\frac{u}{1 + e^{\frac{-\pi}{s}}} + \frac{1 - u}{1 + e^{\frac{\pi}{s}}}} + -1\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Final simplification98.9%
(FPCore (u s) :precision binary32 (let* ((t_0 (+ 0.25 (* u 0.5)))) (* s (+ (log (* t_0 (* PI 4.0))) (+ (log s) (/ (* s 0.25) (* PI t_0)))))))
float code(float u, float s) {
float t_0 = 0.25f + (u * 0.5f);
return s * (logf((t_0 * (((float) M_PI) * 4.0f))) + (logf(s) + ((s * 0.25f) / (((float) M_PI) * t_0))));
}
function code(u, s) t_0 = Float32(Float32(0.25) + Float32(u * Float32(0.5))) return Float32(s * Float32(log(Float32(t_0 * Float32(Float32(pi) * Float32(4.0)))) + Float32(log(s) + Float32(Float32(s * Float32(0.25)) / Float32(Float32(pi) * t_0))))) end
function tmp = code(u, s) t_0 = single(0.25) + (u * single(0.5)); tmp = s * (log((t_0 * (single(pi) * single(4.0)))) + (log(s) + ((s * single(0.25)) / (single(pi) * t_0)))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := 0.25 + u \cdot 0.5\\
s \cdot \left(\log \left(t_0 \cdot \left(\pi \cdot 4\right)\right) + \left(\log s + \frac{s \cdot 0.25}{\pi \cdot t_0}\right)\right)
\end{array}
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in s around 0 25.1%
add-sqr-sqrt-0.0%
sqrt-unprod7.6%
sqr-neg7.6%
Applied egg-rr25.2%
distribute-lft-in25.2%
associate-*r*25.2%
*-commutative25.2%
associate-*l*25.2%
*-commutative25.2%
associate-*l/25.2%
Simplified25.2%
Final simplification25.2%
(FPCore (u s) :precision binary32 (* s (- (- (log s) (* 0.25 (/ s (* PI 0.25)))) (log (* 4.0 (* PI (+ 0.25 (* u 0.5))))))))
float code(float u, float s) {
return s * ((logf(s) - (0.25f * (s / (((float) M_PI) * 0.25f)))) - logf((4.0f * (((float) M_PI) * (0.25f + (u * 0.5f))))));
}
function code(u, s) return Float32(s * Float32(Float32(log(s) - Float32(Float32(0.25) * Float32(s / Float32(Float32(pi) * Float32(0.25))))) - log(Float32(Float32(4.0) * Float32(Float32(pi) * Float32(Float32(0.25) + Float32(u * Float32(0.5)))))))) end
function tmp = code(u, s) tmp = s * ((log(s) - (single(0.25) * (s / (single(pi) * single(0.25))))) - log((single(4.0) * (single(pi) * (single(0.25) + (u * single(0.5))))))); end
\begin{array}{l}
\\
s \cdot \left(\left(\log s - 0.25 \cdot \frac{s}{\pi \cdot 0.25}\right) - \log \left(4 \cdot \left(\pi \cdot \left(0.25 + u \cdot 0.5\right)\right)\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in s around 0 25.1%
Taylor expanded in u around 0 25.1%
Final simplification25.1%
(FPCore (u s) :precision binary32 (* s (- (log (fma -4.0 (/ (* PI (- -0.25 (* u 0.5))) s) 1.0)))))
float code(float u, float s) {
return s * -logf(fmaf(-4.0f, ((((float) M_PI) * (-0.25f - (u * 0.5f))) / s), 1.0f));
}
function code(u, s) return Float32(s * Float32(-log(fma(Float32(-4.0), Float32(Float32(Float32(pi) * Float32(Float32(-0.25) - Float32(u * Float32(0.5)))) / s), Float32(1.0))))) end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\mathsf{fma}\left(-4, \frac{\pi \cdot \left(-0.25 - u \cdot 0.5\right)}{s}, 1\right)\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* s (- (log (+ 1.0 (/ PI s))))))
float code(float u, float s) {
return s * -logf((1.0f + (((float) M_PI) / s)));
}
function code(u, s) return Float32(s * Float32(-log(Float32(Float32(1.0) + Float32(Float32(pi) / s))))) end
function tmp = code(u, s) tmp = s * -log((single(1.0) + (single(pi) / s))); end
\begin{array}{l}
\\
s \cdot \left(-\log \left(1 + \frac{\pi}{s}\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in u around 0 25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* s (- (log1p (/ PI s)))))
float code(float u, float s) {
return s * -log1pf((((float) M_PI) / s));
}
function code(u, s) return Float32(s * Float32(-log1p(Float32(Float32(pi) / s)))) end
\begin{array}{l}
\\
s \cdot \left(-\mathsf{log1p}\left(\frac{\pi}{s}\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in u around 0 25.0%
associate-*r*25.0%
neg-mul-125.0%
log1p-def25.0%
Simplified25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* s (/ (* 0.25 (- s)) (* PI (+ 0.25 (* u 0.5))))))
float code(float u, float s) {
return s * ((0.25f * -s) / (((float) M_PI) * (0.25f + (u * 0.5f))));
}
function code(u, s) return Float32(s * Float32(Float32(Float32(0.25) * Float32(-s)) / Float32(Float32(pi) * Float32(Float32(0.25) + Float32(u * Float32(0.5)))))) end
function tmp = code(u, s) tmp = s * ((single(0.25) * -s) / (single(pi) * (single(0.25) + (u * single(0.5))))); end
\begin{array}{l}
\\
s \cdot \frac{0.25 \cdot \left(-s\right)}{\pi \cdot \left(0.25 + u \cdot 0.5\right)}
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
fma-def24.9%
associate--r+24.9%
cancel-sign-sub-inv24.9%
distribute-rgt-out--24.9%
*-commutative24.9%
metadata-eval24.9%
metadata-eval24.9%
*-commutative24.9%
Simplified24.9%
+-commutative24.9%
*-commutative24.9%
metadata-eval24.9%
distribute-rgt-out--24.9%
cancel-sign-sub-inv24.9%
metadata-eval24.9%
add-sqr-sqrt24.9%
sqrt-unprod24.9%
swap-sqr24.9%
metadata-eval24.9%
metadata-eval24.9%
swap-sqr24.9%
sqrt-unprod-0.0%
add-sqr-sqrt25.0%
Applied egg-rr25.0%
distribute-lft-out--25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in s around 0 25.1%
Taylor expanded in s around inf 12.6%
*-commutative12.6%
associate-*l/12.6%
Simplified12.6%
Final simplification12.6%
(FPCore (u s) :precision binary32 (* 4.0 (* PI (+ (* u 0.5) -0.25))))
float code(float u, float s) {
return 4.0f * (((float) M_PI) * ((u * 0.5f) + -0.25f));
}
function code(u, s) return Float32(Float32(4.0) * Float32(Float32(pi) * Float32(Float32(u * Float32(0.5)) + Float32(-0.25)))) end
function tmp = code(u, s) tmp = single(4.0) * (single(pi) * ((u * single(0.5)) + single(-0.25))); end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \left(u \cdot 0.5 + -0.25\right)\right)
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 10.7%
associate--r+10.7%
cancel-sign-sub-inv10.7%
distribute-rgt-out--10.7%
*-commutative10.7%
metadata-eval10.7%
metadata-eval10.7%
*-commutative10.7%
Simplified10.7%
+-commutative10.7%
associate-*l*10.7%
distribute-lft-out10.7%
Applied egg-rr10.7%
Final simplification10.7%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in u around 0 10.5%
mul-1-neg10.5%
Simplified10.5%
Final simplification10.5%
(FPCore (u s) :precision binary32 (* s 0.0))
float code(float u, float s) {
return s * 0.0f;
}
real(4) function code(u, s)
real(4), intent (in) :: u
real(4), intent (in) :: s
code = s * 0.0e0
end function
function code(u, s) return Float32(s * Float32(0.0)) end
function tmp = code(u, s) tmp = s * single(0.0); end
\begin{array}{l}
\\
s \cdot 0
\end{array}
Initial program 98.9%
Simplified98.9%
Taylor expanded in s around inf 10.5%
Final simplification10.5%
herbie shell --seed 2023301
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))