
; Evaluates, in binary32,
;   -s * log(1 / (u * (hi - t_0) + t_0) - 1)
; where
;   t_0 = 1 / (1 + exp(PI / s))
;   hi  = 1 / (1 + exp(-PI / s))
; Arguments: u and s.
(FPCore (u s)
:precision binary32
; t_0 is bound once and used twice: as the subtrahend and as the additive offset.
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
; u * (hi - t_0) + t_0 is algebraically u*hi + (1 - u)*t_0.
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
/*
 * Single-precision evaluation of
 *   -s * log(1 / (u * (hi - lo) + lo) - 1)
 * with lo = 1 / (1 + e^(pi/s)) and hi = 1 / (1 + e^(-pi/s)).
 *
 * u, s: float inputs. Returns the float result of the expression above.
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    const float lo = 1.0f / (1.0f + expf(pi / s));
    const float hi = 1.0f / (1.0f + expf(-pi / s));
    /* Multiply and add stay in one expression, as in the original form. */
    const float mix = (u * (hi - lo)) + lo;
    const float arg = (1.0f / mix) - 1.0f;
    return -s * logf(arg);
}
# Float32 evaluation of
#   -s * log(1 / (u * (hi - t_0) + t_0) - 1)
# with t_0 = 1 / (1 + exp(pi / s)) and hi = 1 / (1 + exp(-pi / s)).
# Every intermediate is rounded through Float32(...).
# The assignment and the return are on separate lines: Julia needs a newline
# or `;` between statements.
function code(u, s)
    one32 = Float32(1.0)
    pi32 = Float32(pi)
    t_0 = Float32(one32 / Float32(one32 + exp(Float32(pi32 / s))))
    hi = Float32(one32 / Float32(one32 + exp(Float32(Float32(-pi32) / s))))
    mix = Float32(Float32(u * Float32(hi - t_0)) + t_0)
    return Float32(Float32(-s) * log(Float32(Float32(one32 / mix) - one32)))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   -s * log(1 / (u * (hi - t_0) + t_0) - 1)
    % with t_0 = 1 / (1 + exp(pi / s)) and hi = 1 / (1 + exp(-pi / s)).
    one = single(1.0);
    t_0 = one / (one + exp((single(pi) / s)));
    hi = one / (one + exp((-single(pi) / s)));
    mix = (u * (hi - t_0)) + t_0;
    tmp = -s * log(((one / mix) - one));
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; binary32 expression in u and s:
;   (-s) * log(1 / (u * (hi - t_0) + t_0) - 1)
;   t_0 = 1 / (1 + exp(PI / s)),  hi = 1 / (1 + exp((-PI) / s))
(FPCore (u s)
:precision binary32
; let* binds t_0 so the exp(PI / s) term is written once and referenced twice below.
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
; Reciprocal of the u-weighted combination of hi and t_0; 1.0 is subtracted on the next line.
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
/*
 * Returns -s * logf(1 / (u * (hi - t_0) + t_0) - 1) in float arithmetic,
 * where t_0 = 1 / (1 + expf(pi / s)) and hi = 1 / (1 + expf(-pi / s)).
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    const float e_pos = expf(pi / s);
    const float e_neg = expf(-pi / s);
    const float t_0 = 1.0f / (1.0f + e_pos);
    /* Multiply and add stay in one expression, as in the original form. */
    const float mix = (u * ((1.0f / (1.0f + e_neg)) - t_0)) + t_0;
    return -s * logf((1.0f / mix) - 1.0f);
}
# Computes Float32(-s) * log(1 / (u * (hi - t_0) + t_0) - 1), rounding each
# intermediate to Float32, where
#   t_0 = 1 / (1 + exp(pi / s))
#   hi  = 1 / (1 + exp(-pi / s))
# Each statement is on its own line so the body parses as separate statements.
function code(u, s)
    pi32 = Float32(pi)
    e_pos = exp(Float32(pi32 / s))
    e_neg = exp(Float32(Float32(-pi32) / s))
    t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + e_pos))
    hi = Float32(Float32(1.0) / Float32(Float32(1.0) + e_neg))
    denom = Float32(Float32(u * Float32(hi - t_0)) + t_0)
    arg = Float32(Float32(Float32(1.0) / denom) - Float32(1.0))
    return Float32(Float32(-s) * log(arg))
end
function tmp = code(u, s)
    % Returns -s * log(1 / (u * (hi - t_0) + t_0) - 1) using single constants,
    % where t_0 = 1 / (1 + exp(pi / s)) and hi = 1 / (1 + exp(-pi / s)).
    e_pos = exp((single(pi) / s));
    e_neg = exp((-single(pi) / s));
    t_0 = single(1.0) / (single(1.0) + e_pos);
    hi = single(1.0) / (single(1.0) + e_neg);
    denom = (u * (hi - t_0)) + t_0;
    tmp = -s * log(((single(1.0) / denom) - single(1.0)));
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
; binary32 expression in u and s:
;   s * -( log( 1 / (u / (1 + exp(PI / -s)) + (1 - u) / (1 + exp(PI / s))) + -1 ) )
(FPCore (u s)
:precision binary32
(*
s
(-
(log
(+
(/
1.0
; Denominator: u and (1 - u) each divided by their own 1 + exp(...) term, then summed.
(+
(/ u (+ 1.0 (exp (/ PI (- s)))))
(/ (- 1.0 u) (+ 1.0 (exp (/ PI s))))))
; The subtraction of one is written as adding the literal -1.0.
-1.0)))))
/*
 * Float evaluation of
 *   s * -logf(1 / (u / (1 + e^(pi / -s)) + (1 - u) / (1 + e^(pi / s))) + -1).
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    const float u_part = u / (1.0f + expf(pi / -s));
    const float rest_part = (1.0f - u) / (1.0f + expf(pi / s));
    const float arg = (1.0f / (u_part + rest_part)) + -1.0f;
    return s * -logf(arg);
}
# Float32 evaluation of
#   s * -log(1 / (u / (1 + exp(pi / -s)) + (1 - u) / (1 + exp(pi / s))) + -1),
# rounding each intermediate through Float32(...).
function code(u, s)
    one32 = Float32(1.0)
    pi32 = Float32(pi)
    u_part = Float32(u / Float32(one32 + exp(Float32(pi32 / Float32(-s)))))
    rest_part = Float32(Float32(one32 - u) / Float32(one32 + exp(Float32(pi32 / s))))
    arg = Float32(Float32(one32 / Float32(u_part + rest_part)) + Float32(-1.0))
    return Float32(s * Float32(-log(arg)))
end
function tmp = code(u, s)
    % Evaluates s * -log(1 / (u / (1 + exp(pi / -s)) + (1 - u) / (1 + exp(pi / s))) + -1)
    % with single-precision constants.
    u_part = u / (single(1.0) + exp((single(pi) / -s)));
    rest_part = (single(1.0) - u) / (single(1.0) + exp((single(pi) / s)));
    arg = (single(1.0) / (u_part + rest_part)) + single(-1.0);
    tmp = s * -log(arg);
end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\frac{1}{\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{1 - u}{1 + e^{\frac{\pi}{s}}}} + -1\right)\right)
\end{array}
Initial program 98.9%
Simplified 98.9%
Final simplification 98.9%
; binary32 expression in u and s:  2 * (s * u) - s * log(1 + PI / s)
(FPCore (u s) :precision binary32 (- (* 2.0 (* s u)) (* s (log (+ 1.0 (/ PI s))))))
/*
 * Float evaluation of 2 * (s * u) - s * logf(1 + pi / s).
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    const float log_term = logf(1.0f + (pi / s));
    /* Both products and the subtraction stay in one expression, as in the original form. */
    return (2.0f * (s * u)) - (s * log_term);
}
# Float32 evaluation of 2 * (s * u) - s * log(1 + pi / s), rounding each
# intermediate through Float32(...).
function code(u, s)
    linear = Float32(Float32(2.0) * Float32(s * u))
    log_arg = Float32(Float32(1.0) + Float32(Float32(pi) / s))
    scaled_log = Float32(s * log(log_arg))
    return Float32(linear - scaled_log)
end
function tmp = code(u, s)
    % Evaluates 2 * (s * u) - s * log(1 + pi / s) with single-precision constants.
    linear = single(2.0) * (s * u);
    scaled_log = s * log((single(1.0) + (single(pi) / s)));
    tmp = linear - scaled_log;
end
\begin{array}{l}
\\
2 \cdot \left(s \cdot u\right) - s \cdot \log \left(1 + \frac{\pi}{s}\right)
\end{array}
Initial program 98.9%
Simplified 98.9%
Taylor expanded in s around -inf 24.7%
+-commutative 24.7%
fma-def 24.7%
Simplified 24.7%
Taylor expanded in u around 0 25.0%
Taylor expanded in s around 0 25.0%
*-commutative 25.0%
Simplified 25.0%
Final simplification 25.0%
; binary32 expression:  (-s) * log1p(PI / s)
; u is declared as an argument but does not appear in the body.
(FPCore (u s) :precision binary32 (* (- s) (log1p (/ PI s))))
/*
 * Float evaluation of -s * log1pf(pi / s).
 * The parameter u is accepted but not read.
 */
float code(float u, float s) {
    const float ratio = ((float) M_PI) / s;
    const float neg_s = -s;
    return neg_s * log1pf(ratio);
}
# Float32 evaluation of (-s) * log1p(pi / s).
# The argument u is accepted but not read.
function code(u, s)
    ratio = Float32(Float32(pi) / s)
    neg_s = Float32(-s)
    return Float32(neg_s * log1p(ratio))
end
\begin{array}{l}
\\
\left(-s\right) \cdot \mathsf{log1p}\left(\frac{\pi}{s}\right)
\end{array}
Initial program 98.9%
Simplified 98.9%
Taylor expanded in s around -inf 24.7%
+-commutative 24.7%
fma-def 24.7%
Simplified 24.7%
Taylor expanded in u around 0 25.0%
associate-*r* 25.0%
neg-mul-1 25.0%
log1p-def 25.0%
Simplified 25.0%
Final simplification 25.0%
; binary32 expression:  4 * (PI * (-0.25 + u * 0.5))
; s is declared as an argument but does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (* PI (+ -0.25 (* u 0.5)))))
/*
 * Float evaluation of 4 * (pi * (-0.25 + u * 0.5)).
 * The parameter s is accepted but not read.
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    /* Multiply and add stay in one expression, as in the original form. */
    const float affine = -0.25f + (u * 0.5f);
    return 4.0f * (pi * affine);
}
# Float32 evaluation of 4 * (pi * (-0.25 + u * 0.5)).
# The argument s is accepted but not read.
function code(u, s)
    affine = Float32(Float32(-0.25) + Float32(u * Float32(0.5)))
    scaled = Float32(Float32(pi) * affine)
    return Float32(Float32(4.0) * scaled)
end
function tmp = code(u, s)
    % Evaluates 4 * (pi * (-0.25 + u * 0.5)) with single-precision constants.
    % The argument s is accepted but not read.
    affine = single(-0.25) + (u * single(0.5));
    scaled = single(pi) * affine;
    tmp = single(4.0) * scaled;
end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \left(-0.25 + u \cdot 0.5\right)\right)
\end{array}
Initial program 98.9%
Simplified 98.9%
div-inv 98.8%
add-cube-cbrt 98.9%
associate-*l* 98.8%
pow2 98.8%
Applied egg-rr 98.8%
Taylor expanded in s around inf 11.3%
associate--r+ 11.3%
cancel-sign-sub-inv 11.3%
*-commutative 11.3%
*-commutative 11.3%
associate-*r* 11.3%
*-commutative 11.3%
*-commutative 11.3%
associate-*r* 11.3%
distribute-lft-out-- 11.3%
metadata-eval 11.3%
*-commutative 11.3%
*-commutative 11.3%
metadata-eval 11.3%
+-commutative 11.3%
associate-*r* 11.3%
*-commutative 11.3%
Simplified 11.3%
Final simplification 11.3%
; binary32 constant expression: the negation of PI.
; Both u and s are declared as arguments but neither appears in the body.
(FPCore (u s) :precision binary32 (- PI))
/*
 * Returns M_PI converted to float and negated.
 * Neither u nor s is read.
 */
float code(float u, float s) {
    const float pi = (float) M_PI;
    return -pi;
}
# Returns pi rounded to Float32 and negated.
# Neither u nor s is read.
function code(u, s)
    pi32 = Float32(pi)
    return Float32(-pi32)
end
function tmp = code(u, s)
    % Returns single(pi) negated. Neither u nor s is read.
    pi_single = single(pi);
    tmp = -pi_single;
end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Simplified 98.9%
Taylor expanded in u around 0 11.1%
neg-mul-1 11.1%
Simplified 11.1%
Final simplification 11.1%
herbie shell --seed 2024011
; Benchmark definition: a binary32 expression in u and s with a precondition on both.
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
; Precondition: 2.328306437e-10 <= u <= 1.0 (the lower bound is approximately 2^-32)
; and 0.0 <= s <= 1.0651631.
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
; Body: (-s) * log(1 / (u * (hi - lo) + lo) - 1), with lo = 1 / (1 + exp(PI / s)) and
; hi = 1 / (1 + exp((-PI) / s)). The lo term is written out twice here, not bound with let.
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))