
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(*
s
(-
(log
(+
(/
1.0
(+
(/ u (+ 1.0 (exp (/ (- PI) s))))
(/ (- 1.0 u) (+ 1.0 (exp (/ PI s))))))
-1.0)))))
float code(float u, float s) {
return s * -logf(((1.0f / ((u / (1.0f + expf((-((float) M_PI) / s)))) + ((1.0f - u) / (1.0f + expf((((float) M_PI) / s)))))) + -1.0f));
}
function code(u, s) return Float32(s * Float32(-log(Float32(Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) + Float32(Float32(Float32(1.0) - u) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))))) + Float32(-1.0))))) end
function tmp = code(u, s) tmp = s * -log(((single(1.0) / ((u / (single(1.0) + exp((-single(pi) / s)))) + ((single(1.0) - u) / (single(1.0) + exp((single(pi) / s)))))) + single(-1.0))); end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\frac{1}{\frac{u}{1 + e^{\frac{-\pi}{s}}} + \frac{1 - u}{1 + e^{\frac{\pi}{s}}}} + -1\right)\right)
\end{array}
Initial program 99.1%
distribute-lft-neg-out99.1%
distribute-rgt-neg-in99.1%
sub-neg99.1%
Simplified99.1%
Final simplification99.1%
(FPCore (u s) :precision binary32 (* 4.0 (* PI (+ (* u 0.5) -0.25))))
float code(float u, float s) {
return 4.0f * (((float) M_PI) * ((u * 0.5f) + -0.25f));
}
function code(u, s) return Float32(Float32(4.0) * Float32(Float32(pi) * Float32(Float32(u * Float32(0.5)) + Float32(-0.25)))) end
function tmp = code(u, s) tmp = single(4.0) * (single(pi) * ((u * single(0.5)) + single(-0.25))); end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \left(u \cdot 0.5 + -0.25\right)\right)
\end{array}
Initial program 99.1%
distribute-lft-neg-out99.1%
distribute-rgt-neg-in99.1%
sub-neg99.1%
Simplified99.1%
Taylor expanded in s around inf 10.9%
associate--r+10.9%
cancel-sign-sub-inv10.9%
distribute-rgt-out--10.9%
*-commutative10.9%
metadata-eval10.9%
metadata-eval10.9%
*-commutative10.9%
Simplified10.9%
expm1-log1p-u10.9%
Applied egg-rr10.9%
Taylor expanded in u around 0 10.9%
+-commutative10.9%
associate-*r*10.9%
*-commutative10.9%
distribute-rgt-out10.9%
Simplified10.9%
Final simplification10.9%
(FPCore (u s) :precision binary32 (* s (- (log s) (* u -2.0))))
float code(float u, float s) {
return s * (logf(s) - (u * -2.0f));
}
real(4) function code(u, s)
real(4), intent (in) :: u
real(4), intent (in) :: s
code = s * (log(s) - (u * (-2.0e0)))
end function
function code(u, s) return Float32(s * Float32(log(s) - Float32(u * Float32(-2.0)))) end
function tmp = code(u, s) tmp = s * (log(s) - (u * single(-2.0))); end
\begin{array}{l}
\\
s \cdot \left(\log s - u \cdot -2\right)
\end{array}
Initial program 99.1%
distribute-lft-neg-out99.1%
distribute-rgt-neg-in99.1%
sub-neg99.1%
Simplified99.1%
Taylor expanded in s around -inf 24.5%
+-commutative24.5%
fma-def24.5%
associate--r+24.5%
cancel-sign-sub-inv24.5%
distribute-rgt-out--24.5%
*-commutative24.5%
metadata-eval24.5%
metadata-eval24.5%
*-commutative24.5%
Simplified24.5%
Taylor expanded in s around 0 24.7%
mul-1-neg24.7%
*-commutative24.7%
distribute-rgt-neg-in24.7%
Simplified24.7%
Taylor expanded in u around 0 25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in u around inf 25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 99.1%
distribute-lft-neg-out99.1%
distribute-rgt-neg-in99.1%
sub-neg99.1%
Simplified99.1%
Taylor expanded in u around 0 10.6%
mul-1-neg10.6%
Simplified10.6%
Final simplification10.6%
(FPCore (u s) :precision binary32 (* 2.0 (* s u)))
float code(float u, float s) {
return 2.0f * (s * u);
}
real(4) function code(u, s)
real(4), intent (in) :: u
real(4), intent (in) :: s
code = 2.0e0 * (s * u)
end function
function code(u, s) return Float32(Float32(2.0) * Float32(s * u)) end
function tmp = code(u, s) tmp = single(2.0) * (s * u); end
\begin{array}{l}
\\
2 \cdot \left(s \cdot u\right)
\end{array}
Initial program 99.1%
distribute-lft-neg-out99.1%
distribute-rgt-neg-in99.1%
sub-neg99.1%
Simplified99.1%
Taylor expanded in s around -inf 24.5%
+-commutative24.5%
fma-def24.5%
associate--r+24.5%
cancel-sign-sub-inv24.5%
distribute-rgt-out--24.5%
*-commutative24.5%
metadata-eval24.5%
metadata-eval24.5%
*-commutative24.5%
Simplified24.5%
Taylor expanded in s around 0 24.7%
mul-1-neg24.7%
*-commutative24.7%
distribute-rgt-neg-in24.7%
Simplified24.7%
Taylor expanded in u around 0 25.0%
*-commutative25.0%
Simplified25.0%
Taylor expanded in u around inf 9.3%
*-commutative9.3%
Simplified9.3%
Final simplification9.3%
herbie shell --seed 2023194
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))