
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(*
(log
(+
(/
1.0
(+ (/ u (+ 1.0 (exp (- (/ PI s))))) (/ (- 1.0 u) (+ 1.0 (exp (/ PI s))))))
-1.0))
(- s)))
float code(float u, float s) {
return logf(((1.0f / ((u / (1.0f + expf(-(((float) M_PI) / s)))) + ((1.0f - u) / (1.0f + expf((((float) M_PI) / s)))))) + -1.0f)) * -s;
}
function code(u, s) return Float32(log(Float32(Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(-Float32(Float32(pi) / s))))) + Float32(Float32(Float32(1.0) - u) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))))) + Float32(-1.0))) * Float32(-s)) end
function tmp = code(u, s) tmp = log(((single(1.0) / ((u / (single(1.0) + exp(-(single(pi) / s)))) + ((single(1.0) - u) / (single(1.0) + exp((single(pi) / s)))))) + single(-1.0))) * -s; end
\begin{array}{l}
\\
\log \left(\frac{1}{\frac{u}{1 + e^{-\frac{\pi}{s}}} + \frac{1 - u}{1 + e^{\frac{\pi}{s}}}} + -1\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Final simplification98.8%
(FPCore (u s) :precision binary32 (* (log (fma 4.0 (fabs (* PI (/ (fma u 0.5 -0.25) s))) 1.0)) (- s)))
float code(float u, float s) {
return logf(fmaf(4.0f, fabsf((((float) M_PI) * (fmaf(u, 0.5f, -0.25f) / s))), 1.0f)) * -s;
}
function code(u, s) return Float32(log(fma(Float32(4.0), abs(Float32(Float32(pi) * Float32(fma(u, Float32(0.5), Float32(-0.25)) / s))), Float32(1.0))) * Float32(-s)) end
\begin{array}{l}
\\
\log \left(\mathsf{fma}\left(4, \left|\pi \cdot \frac{\mathsf{fma}\left(u, 0.5, -0.25\right)}{s}\right|, 1\right)\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in s around -inf 24.8%
+-commutative24.8%
fma-def24.8%
associate--r+24.8%
cancel-sign-sub-inv24.8%
distribute-rgt-out--24.8%
*-commutative24.8%
metadata-eval24.8%
metadata-eval24.8%
*-commutative24.8%
Simplified24.8%
add-sqr-sqrt24.8%
sqrt-unprod15.8%
pow215.8%
Applied egg-rr15.8%
unpow215.8%
rem-sqrt-square25.0%
*-rgt-identity25.0%
associate-*r/25.0%
associate-*l*25.0%
associate-*r/25.0%
*-rgt-identity25.0%
fma-def25.0%
Simplified25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* (log (fma 4.0 (fabs (* PI (+ (* 0.5 (/ u s)) (* 0.25 (/ -1.0 s))))) 1.0)) (- s)))
float code(float u, float s) {
return logf(fmaf(4.0f, fabsf((((float) M_PI) * ((0.5f * (u / s)) + (0.25f * (-1.0f / s))))), 1.0f)) * -s;
}
function code(u, s) return Float32(log(fma(Float32(4.0), abs(Float32(Float32(pi) * Float32(Float32(Float32(0.5) * Float32(u / s)) + Float32(Float32(0.25) * Float32(Float32(-1.0) / s))))), Float32(1.0))) * Float32(-s)) end
\begin{array}{l}
\\
\log \left(\mathsf{fma}\left(4, \left|\pi \cdot \left(0.5 \cdot \frac{u}{s} + 0.25 \cdot \frac{-1}{s}\right)\right|, 1\right)\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in s around -inf 24.8%
+-commutative24.8%
fma-def24.8%
associate--r+24.8%
cancel-sign-sub-inv24.8%
distribute-rgt-out--24.8%
*-commutative24.8%
metadata-eval24.8%
metadata-eval24.8%
*-commutative24.8%
Simplified24.8%
add-sqr-sqrt24.8%
sqrt-unprod15.8%
pow215.8%
Applied egg-rr15.8%
unpow215.8%
rem-sqrt-square25.0%
*-rgt-identity25.0%
associate-*r/25.0%
associate-*l*25.0%
associate-*r/25.0%
*-rgt-identity25.0%
fma-def25.0%
Simplified25.0%
Taylor expanded in u around 0 25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* (log1p (* 4.0 (fabs (* PI (+ (* (/ u s) -0.5) (/ 0.25 s)))))) (- s)))
float code(float u, float s) {
return log1pf((4.0f * fabsf((((float) M_PI) * (((u / s) * -0.5f) + (0.25f / s)))))) * -s;
}
function code(u, s) return Float32(log1p(Float32(Float32(4.0) * abs(Float32(Float32(pi) * Float32(Float32(Float32(u / s) * Float32(-0.5)) + Float32(Float32(0.25) / s)))))) * Float32(-s)) end
\begin{array}{l}
\\
\mathsf{log1p}\left(4 \cdot \left|\pi \cdot \left(\frac{u}{s} \cdot -0.5 + \frac{0.25}{s}\right)\right|\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in s around -inf 24.8%
+-commutative24.8%
fma-def24.8%
associate--r+24.8%
cancel-sign-sub-inv24.8%
distribute-rgt-out--24.8%
*-commutative24.8%
metadata-eval24.8%
metadata-eval24.8%
*-commutative24.8%
Simplified24.8%
add-sqr-sqrt24.8%
sqrt-unprod15.8%
pow215.8%
Applied egg-rr15.8%
unpow215.8%
rem-sqrt-square25.0%
*-rgt-identity25.0%
associate-*r/25.0%
associate-*l*25.0%
associate-*r/25.0%
*-rgt-identity25.0%
fma-def25.0%
Simplified25.0%
Taylor expanded in u around 0 25.0%
Taylor expanded in u around -inf 25.0%
log1p-def25.0%
mul-1-neg25.0%
*-commutative25.0%
associate-*r/25.0%
metadata-eval25.0%
+-commutative25.0%
Simplified25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* (log (+ 1.0 (* 4.0 (fabs (* PI (/ -0.25 s)))))) (- s)))
float code(float u, float s) {
return logf((1.0f + (4.0f * fabsf((((float) M_PI) * (-0.25f / s)))))) * -s;
}
function code(u, s) return Float32(log(Float32(Float32(1.0) + Float32(Float32(4.0) * abs(Float32(Float32(pi) * Float32(Float32(-0.25) / s)))))) * Float32(-s)) end
function tmp = code(u, s) tmp = log((single(1.0) + (single(4.0) * abs((single(pi) * (single(-0.25) / s)))))) * -s; end
\begin{array}{l}
\\
\log \left(1 + 4 \cdot \left|\pi \cdot \frac{-0.25}{s}\right|\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in s around -inf 24.8%
+-commutative24.8%
fma-def24.8%
associate--r+24.8%
cancel-sign-sub-inv24.8%
distribute-rgt-out--24.8%
*-commutative24.8%
metadata-eval24.8%
metadata-eval24.8%
*-commutative24.8%
Simplified24.8%
add-sqr-sqrt24.8%
sqrt-unprod15.8%
pow215.8%
Applied egg-rr15.8%
unpow215.8%
rem-sqrt-square25.0%
*-rgt-identity25.0%
associate-*r/25.0%
associate-*l*25.0%
associate-*r/25.0%
*-rgt-identity25.0%
fma-def25.0%
Simplified25.0%
Taylor expanded in u around 0 24.9%
fma-udef24.9%
Applied egg-rr24.9%
Final simplification24.9%
(FPCore (u s) :precision binary32 (* (log (+ 1.0 (/ PI s))) (- s)))
float code(float u, float s) {
return logf((1.0f + (((float) M_PI) / s))) * -s;
}
function code(u, s) return Float32(log(Float32(Float32(1.0) + Float32(Float32(pi) / s))) * Float32(-s)) end
function tmp = code(u, s) tmp = log((single(1.0) + (single(pi) / s))) * -s; end
\begin{array}{l}
\\
\log \left(1 + \frac{\pi}{s}\right) \cdot \left(-s\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in u around 0 5.7%
Taylor expanded in s around inf 24.9%
+-commutative24.9%
Simplified24.9%
Final simplification24.9%
(FPCore (u s) :precision binary32 (* 4.0 (* PI (fma u 0.5 -0.25))))
float code(float u, float s) {
return 4.0f * (((float) M_PI) * fmaf(u, 0.5f, -0.25f));
}
function code(u, s) return Float32(Float32(4.0) * Float32(Float32(pi) * fma(u, Float32(0.5), Float32(-0.25)))) end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \mathsf{fma}\left(u, 0.5, -0.25\right)\right)
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in s around inf 11.6%
associate--r+11.6%
cancel-sign-sub-inv11.6%
distribute-rgt-out--11.6%
*-commutative11.6%
metadata-eval11.6%
metadata-eval11.6%
*-commutative11.6%
Simplified11.6%
Taylor expanded in u around 0 11.6%
+-commutative11.6%
associate-*r*11.6%
*-commutative11.6%
distribute-rgt-in11.6%
fma-def11.6%
Simplified11.6%
Final simplification11.6%
(FPCore (u s) :precision binary32 (* s (/ (- PI) s)))
float code(float u, float s) {
return s * (-((float) M_PI) / s);
}
function code(u, s) return Float32(s * Float32(Float32(-Float32(pi)) / s)) end
function tmp = code(u, s) tmp = s * (-single(pi) / s); end
\begin{array}{l}
\\
s \cdot \frac{-\pi}{s}
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in u around 0 5.7%
Taylor expanded in s around 0 11.2%
Final simplification11.2%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in u around 0 11.2%
mul-1-neg11.2%
Simplified11.2%
Final simplification11.2%
(FPCore (u s) :precision binary32 PI)
float code(float u, float s) {
return (float) M_PI;
}
function code(u, s) return Float32(pi) end
function tmp = code(u, s) tmp = single(pi); end
\begin{array}{l}
\\
\pi
\end{array}
Initial program 98.8%
distribute-lft-neg-out98.8%
distribute-rgt-neg-in98.8%
sub-neg98.8%
Simplified98.8%
Taylor expanded in u around 0 5.7%
add-sqr-sqrt-0.0%
sqrt-unprod2.3%
sqr-neg2.3%
sqrt-unprod2.3%
add-sqr-sqrt2.3%
add-log-exp4.7%
clear-num4.7%
un-div-inv4.7%
Applied egg-rr4.7%
Taylor expanded in s around 0 4.7%
Final simplification4.7%
herbie shell --seed 2023208
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))