
; Input program (binary32): -s * log(1 / (u * (1/(1 + e^(-PI/s)) - t_0) + t_0) - 1).
; t_0 = 1 / (1 + e^(PI/s)) is bound once with let* and used twice.
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
/*
 * Single-precision evaluation of
 *   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
 * where t_0 = 1 / (1 + exp(pi/s)) is computed once and reused.
 * M_PI is cast to float before every use, so all arithmetic is written in float.
 * NOTE(review): s == 0 divides by zero inside both expf arguments; no guard is present.
 */
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
# Float32 evaluation of
#   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
# with t_0 = 1 / (1 + exp(pi/s)) computed once and reused.
# Every intermediate result is wrapped in Float32(...) so each operation is
# rounded to single precision. The two statements sit on separate lines:
# Julia needs a newline or `;` between statements in a function body.
function code(u, s)
    t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s))))
    return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
    % with t_0 = 1 / (1 + exp(pi/s)) computed once and reused.
    % Constants are created with single(...) so they do not enter as doubles.
    t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s)));
    tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0)));
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 9 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; First listed alternative (binary32): -s * log(1 / (u * (1/(1 + e^(-PI/s)) - t_0) + t_0) - 1).
; t_0 = 1 / (1 + e^(PI/s)) is bound once with let* and used twice.
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
/*
 * Single-precision evaluation of
 *   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
 * where t_0 = 1 / (1 + exp(pi/s)) is computed once and reused.
 * M_PI is cast to float before every use, so all arithmetic is written in float.
 * NOTE(review): s == 0 divides by zero inside both expf arguments; no guard is present.
 */
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
# Float32 evaluation of
#   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
# with t_0 = 1 / (1 + exp(pi/s)) computed once and reused.
# Every intermediate result is wrapped in Float32(...) so each operation is
# rounded to single precision. The two statements sit on separate lines:
# Julia needs a newline or `;` between statements in a function body.
function code(u, s)
    t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s))))
    return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   -s * log(1 / (u * (1/(1 + exp(-pi/s)) - t_0) + t_0) - 1)
    % with t_0 = 1 / (1 + exp(pi/s)) computed once and reused.
    % Constants are created with single(...) so they do not enter as doubles.
    t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s)));
    tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0)));
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t_0\right) + t_0} - 1\right)
\end{array}
\end{array}
; Alternative (binary32): s * -(log(1 / (u/(1 + e^(-PI/s)) + (1 - u)/(1 + e^(PI/s))) + -1)).
; The u-weighted difference of the input form is written here as a sum of two
; quotients weighted by u and (1 - u); no let* binding is used.
(FPCore (u s)
:precision binary32
(*
s
(-
(log
(+
(/
1.0
(+
(/ u (+ 1.0 (exp (/ (- PI) s))))
(/ (- 1.0 u) (+ 1.0 (exp (/ PI s))))))
-1.0)))))
/*
 * Single-precision evaluation of
 *   s * -log(1 / (u/(1 + exp(-pi/s)) + (1 - u)/(1 + exp(pi/s))) + -1)
 * The denominator is the sum of two quotients weighted by u and (1 - u).
 * NOTE(review): s == 0 divides by zero inside both expf arguments; no guard is present.
 */
float code(float u, float s) {
return s * -logf(((1.0f / ((u / (1.0f + expf((-((float) M_PI) / s)))) + ((1.0f - u) / (1.0f + expf((((float) M_PI) / s)))))) + -1.0f));
}
# Float32 evaluation of
#   s * -log(1 / (u/(1 + exp(-pi/s)) + (1 - u)/(1 + exp(pi/s))) + -1)
# Every intermediate result is wrapped in Float32(...) so each operation is
# rounded to single precision.
function code(u, s)
    return Float32(s * Float32(-log(Float32(Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) + Float32(Float32(Float32(1.0) - u) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))))) + Float32(-1.0)))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   s * -log(1 / (u/(1 + exp(-pi/s)) + (1 - u)/(1 + exp(pi/s))) + -1)
    % Constants are created with single(...) so they do not enter as doubles.
    tmp = s * -log(((single(1.0) / ((u / (single(1.0) + exp((-single(pi) / s)))) + ((single(1.0) - u) / (single(1.0) + exp((single(pi) / s)))))) + single(-1.0)));
end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\frac{1}{\frac{u}{1 + e^{\frac{-\pi}{s}}} + \frac{1 - u}{1 + e^{\frac{\pi}{s}}}} + -1\right)\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Final simplification 99.0%
; Alternative (binary32): s * -log(fma(4, ((u*PI)*-0.5 + PI*0.25) / s, 1)).
; No exp call remains; the log argument is a single fused multiply-add.
(FPCore (u s) :precision binary32 (* s (- (log (fma 4.0 (/ (+ (* (* u PI) -0.5) (* PI 0.25)) s) 1.0)))))
/*
 * Single-precision evaluation of
 *   s * -log(fma(4, ((u*pi)*-0.5 + pi*0.25) / s, 1))
 * Uses fmaf for the final multiply-add inside the logarithm; no expf call.
 * NOTE(review): the logf argument is 1 + pi*(1 - 2u)/s algebraically, which is
 * negative for u sufficiently above 0.5 -- confirm callers stay in range.
 */
float code(float u, float s) {
return s * -logf(fmaf(4.0f, ((((u * ((float) M_PI)) * -0.5f) + (((float) M_PI) * 0.25f)) / s), 1.0f));
}
# Float32 evaluation of
#   s * -log(fma(4, ((u*pi)*-0.5 + pi*0.25) / s, 1))
# The multiply-add inside the logarithm goes through fma; every other
# intermediate result is wrapped in Float32(...).
function code(u, s)
    return Float32(s * Float32(-log(fma(Float32(4.0), Float32(Float32(Float32(Float32(u * Float32(pi)) * Float32(-0.5)) + Float32(Float32(pi) * Float32(0.25))) / s), Float32(1.0)))))
end
\begin{array}{l}
\\
s \cdot \left(-\log \left(\mathsf{fma}\left(4, \frac{\left(u \cdot \pi\right) \cdot -0.5 + \pi \cdot 0.25}{s}, 1\right)\right)\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around -inf 24.3%
+-commutative 24.3%
fma-def 24.3%
associate--r+ 24.3%
cancel-sign-sub-inv 24.3%
distribute-rgt-out-- 24.3%
*-commutative 24.3%
metadata-eval 24.3%
metadata-eval 24.3%
*-commutative 24.3%
Simplified 24.3%
Final simplification 24.3%
; Alternative (binary32): 4 * (expm1(log(1 + u*PI)) * 0.5 + PI * -0.25).
; The argument s does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (+ (* (expm1 (log (+ 1.0 (* u PI)))) 0.5) (* PI -0.25))))
/*
 * Single-precision evaluation of
 *   4 * (expm1(log(1 + u*pi)) * 0.5 + pi * -0.25)
 * The parameter s is accepted but never read.
 */
float code(float u, float s) {
return 4.0f * ((expm1f(logf((1.0f + (u * ((float) M_PI))))) * 0.5f) + (((float) M_PI) * -0.25f));
}
# Float32 evaluation of
#   4 * (expm1(log(1 + u*pi)) * 0.5 + pi * -0.25)
# The argument s is accepted but never read.
function code(u, s)
    return Float32(Float32(4.0) * Float32(Float32(expm1(log(Float32(Float32(1.0) + Float32(u * Float32(pi))))) * Float32(0.5)) + Float32(Float32(pi) * Float32(-0.25))))
end
\begin{array}{l}
\\
4 \cdot \left(\mathsf{expm1}\left(\log \left(1 + u \cdot \pi\right)\right) \cdot 0.5 + \pi \cdot -0.25\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.8%
associate--r+ 10.8%
cancel-sign-sub-inv 10.8%
distribute-rgt-out-- 10.8%
*-commutative 10.8%
metadata-eval 10.8%
metadata-eval 10.8%
*-commutative 10.8%
Simplified 10.8%
expm1-log1p-u 10.8%
Applied egg-rr 10.8%
log1p-udef 10.8%
*-commutative 10.8%
Applied egg-rr 10.8%
Final simplification 10.8%
; Alternative (binary32): 4 * (PI * -0.25 + 0.5 * (1 + (-1 + u*PI))).
; The inner sum adds -1 first, then 1. The argument s does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (+ (* PI -0.25) (* 0.5 (+ 1.0 (+ -1.0 (* u PI)))))))
/*
 * Single-precision evaluation of
 *   4 * (pi * -0.25 + 0.5 * (1 + (-1 + u*pi)))
 * The inner sum adds -1 to u*pi first, then adds 1.
 * The parameter s is accepted but never read.
 */
float code(float u, float s) {
return 4.0f * ((((float) M_PI) * -0.25f) + (0.5f * (1.0f + (-1.0f + (u * ((float) M_PI))))));
}
# Float32 evaluation of
#   4 * (pi * -0.25 + 0.5 * (1 + (-1 + u*pi)))
# The inner sum adds -1 to u*pi first, then adds 1.
# The argument s is accepted but never read.
function code(u, s)
    return Float32(Float32(4.0) * Float32(Float32(Float32(pi) * Float32(-0.25)) + Float32(Float32(0.5) * Float32(Float32(1.0) + Float32(Float32(-1.0) + Float32(u * Float32(pi)))))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   4 * (pi * -0.25 + 0.5 * (1 + (-1 + u*pi)))
    % The inner sum adds -1 to u*pi first, then adds 1.
    % The argument s is accepted but never read.
    tmp = single(4.0) * ((single(pi) * single(-0.25)) + (single(0.5) * (single(1.0) + (single(-1.0) + (u * single(pi))))));
end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot -0.25 + 0.5 \cdot \left(1 + \left(-1 + u \cdot \pi\right)\right)\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.8%
associate--r+ 10.8%
cancel-sign-sub-inv 10.8%
distribute-rgt-out-- 10.8%
*-commutative 10.8%
metadata-eval 10.8%
metadata-eval 10.8%
*-commutative 10.8%
Simplified 10.8%
expm1-log1p-u 10.8%
Applied egg-rr 10.8%
expm1-udef 10.8%
log1p-udef 10.8%
add-exp-log 10.8%
*-commutative 10.8%
Applied egg-rr 10.8%
associate--l+ 10.8%
*-commutative 10.8%
Simplified 10.8%
Final simplification 10.8%
; Alternative (binary32): 4 * (PI * -0.25 + 0.5 * (-1 + (1 + u*PI))).
; The inner sum adds 1 first, then -1. The argument s does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (+ (* PI -0.25) (* 0.5 (+ -1.0 (+ 1.0 (* u PI)))))))
/*
 * Single-precision evaluation of
 *   4 * (pi * -0.25 + 0.5 * (-1 + (1 + u*pi)))
 * The inner sum adds 1 to u*pi first, then adds -1.
 * The parameter s is accepted but never read.
 */
float code(float u, float s) {
return 4.0f * ((((float) M_PI) * -0.25f) + (0.5f * (-1.0f + (1.0f + (u * ((float) M_PI))))));
}
# Float32 evaluation of
#   4 * (pi * -0.25 + 0.5 * (-1 + (1 + u*pi)))
# The inner sum adds 1 to u*pi first, then adds -1.
# The argument s is accepted but never read.
function code(u, s)
    return Float32(Float32(4.0) * Float32(Float32(Float32(pi) * Float32(-0.25)) + Float32(Float32(0.5) * Float32(Float32(-1.0) + Float32(Float32(1.0) + Float32(u * Float32(pi)))))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   4 * (pi * -0.25 + 0.5 * (-1 + (1 + u*pi)))
    % The inner sum adds 1 to u*pi first, then adds -1.
    % The argument s is accepted but never read.
    tmp = single(4.0) * ((single(pi) * single(-0.25)) + (single(0.5) * (single(-1.0) + (single(1.0) + (u * single(pi))))));
end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot -0.25 + 0.5 \cdot \left(-1 + \left(1 + u \cdot \pi\right)\right)\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.8%
associate--r+ 10.8%
cancel-sign-sub-inv 10.8%
distribute-rgt-out-- 10.8%
*-commutative 10.8%
metadata-eval 10.8%
metadata-eval 10.8%
*-commutative 10.8%
Simplified 10.8%
expm1-log1p-u 10.8%
Applied egg-rr 10.8%
expm1-udef 10.8%
log1p-udef 10.8%
add-exp-log 10.8%
*-commutative 10.8%
Applied egg-rr 10.8%
Final simplification 10.8%
; Alternative (binary32): 4 * (PI * -0.25 + (u*PI) * 0.5).
; The argument s does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (+ (* PI -0.25) (* (* u PI) 0.5))))
/*
 * Single-precision evaluation of
 *   4 * (pi * -0.25 + (u*pi) * 0.5)
 * The parameter s is accepted but never read.
 */
float code(float u, float s) {
return 4.0f * ((((float) M_PI) * -0.25f) + ((u * ((float) M_PI)) * 0.5f));
}
# Float32 evaluation of
#   4 * (pi * -0.25 + (u*pi) * 0.5)
# The argument s is accepted but never read.
function code(u, s)
    return Float32(Float32(4.0) * Float32(Float32(Float32(pi) * Float32(-0.25)) + Float32(Float32(u * Float32(pi)) * Float32(0.5))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   4 * (pi * -0.25 + (u*pi) * 0.5)
    % The argument s is accepted but never read.
    tmp = single(4.0) * ((single(pi) * single(-0.25)) + ((u * single(pi)) * single(0.5)));
end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot -0.25 + \left(u \cdot \pi\right) \cdot 0.5\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.8%
associate--r+ 10.8%
cancel-sign-sub-inv 10.8%
distribute-rgt-out-- 10.8%
*-commutative 10.8%
metadata-eval 10.8%
metadata-eval 10.8%
*-commutative 10.8%
Simplified 10.8%
Final simplification 10.8%
; Alternative (binary32): 4 * (PI * (-0.25 + u * 0.5)).
; PI is factored out of the sum. The argument s does not appear in the body.
(FPCore (u s) :precision binary32 (* 4.0 (* PI (+ -0.25 (* u 0.5)))))
/*
 * Single-precision evaluation of
 *   4 * (pi * (-0.25 + u * 0.5))
 * The parameter s is accepted but never read.
 */
float code(float u, float s) {
return 4.0f * (((float) M_PI) * (-0.25f + (u * 0.5f)));
}
# Float32 evaluation of
#   4 * (pi * (-0.25 + u * 0.5))
# The argument s is accepted but never read.
function code(u, s)
    return Float32(Float32(4.0) * Float32(Float32(pi) * Float32(Float32(-0.25) + Float32(u * Float32(0.5)))))
end
function tmp = code(u, s)
    % Single-precision evaluation of
    %   4 * (pi * (-0.25 + u * 0.5))
    % The argument s is accepted but never read.
    tmp = single(4.0) * (single(pi) * (single(-0.25) + (u * single(0.5))));
end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \left(-0.25 + u \cdot 0.5\right)\right)
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.8%
associate--r+ 10.8%
cancel-sign-sub-inv 10.8%
distribute-rgt-out-- 10.8%
*-commutative 10.8%
metadata-eval 10.8%
metadata-eval 10.8%
*-commutative 10.8%
Simplified 10.8%
Taylor expanded in u around 0 10.8%
*-commutative 10.8%
*-commutative 10.8%
*-commutative 10.8%
associate-*r* 10.8%
distribute-lft-out 10.8%
Simplified 10.8%
Final simplification 10.8%
; Alternative (binary32): the constant -PI. Neither u nor s appears in the body.
(FPCore (u s) :precision binary32 (- PI))
/*
 * Returns the constant -pi, with M_PI cast to float before negation.
 * Both parameters are accepted but never read.
 */
float code(float u, float s) {
return -((float) M_PI);
}
# Returns the constant -pi as a Float32.
# Both arguments are accepted but never read.
function code(u, s)
    return Float32(-Float32(pi))
end
function tmp = code(u, s)
    % Returns the constant -pi in single precision.
    % Both arguments are accepted but never read.
    tmp = -single(pi);
end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in u around 0 10.4%
mul-1-neg 10.4%
Simplified 10.4%
Final simplification 10.4%
; Alternative (binary32): s * 0. The argument u does not appear in the body.
(FPCore (u s) :precision binary32 (* s 0.0))
/*
 * Returns s * 0.0f. The parameter u is accepted but never read.
 * The product is kept as written rather than folded to a literal zero, so the
 * result still depends on s the way IEEE multiplication by zero does.
 */
float code(float u, float s) {
return s * 0.0f;
}
! Returns s * 0 in single precision; the dummy argument u is never read.
real(4) function code(u, s)
    real(4), intent (in) :: u
    real(4), intent (in) :: s

    code = s * 0.0e0
end function code
# Returns s * 0 as a Float32; the argument u is never read.
function code(u, s)
    return Float32(s * Float32(0.0))
end
function tmp = code(u, s)
    % Returns s * 0 in single precision; the argument u is never read.
    tmp = s * single(0.0);
end
\begin{array}{l}
\\
s \cdot 0
\end{array}
Initial program 99.0%
distribute-lft-neg-out 99.0%
distribute-rgt-neg-in 99.0%
sub-neg 99.0%
Simplified 99.0%
Taylor expanded in s around inf 10.4%
Final simplification 10.4%
herbie shell --seed 2023252
; Named benchmark with its input precondition, in binary32.
; :pre restricts u to [2.328306437e-10, 1] and s to [0, 1.0651631].
; The body spells out 1 / (1 + e^(PI/s)) twice instead of binding it with let*.
; NOTE(review): the precondition admits s = 0, where PI/s divides by zero -- confirm intended.
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))