
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(*
(log
(-
(/
1.0
(fma
(- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) (/ 1.0 (+ (exp (/ PI s)) 1.0)))
u
(/ 1.0 (+ (exp (* (/ 1.0 s) PI)) 1.0))))
1.0))
(- s)))
float code(float u, float s) {
return logf(((1.0f / fmaf(((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - (1.0f / (expf((((float) M_PI) / s)) + 1.0f))), u, (1.0f / (expf(((1.0f / s) * ((float) M_PI))) + 1.0f)))) - 1.0f)) * -s;
}
function code(u, s) return Float32(log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0)))), u, Float32(Float32(1.0) / Float32(exp(Float32(Float32(Float32(1.0) / s) * Float32(pi))) + Float32(1.0))))) - Float32(1.0))) * Float32(-s)) end
\begin{array}{l}
\\
\log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - \frac{1}{e^{\frac{\pi}{s}} + 1}, u, \frac{1}{e^{\frac{1}{s} \cdot \pi} + 1}\right)} - 1\right) \cdot \left(-s\right)
\end{array}
Initial program 98.9%
lift-+.f32N/A
lift-*.f32N/A
*-commutativeN/A
lower-fma.f3298.9
Applied rewrites98.9%
lift-PI.f32N/A
lift-/.f32N/A
clear-numN/A
associate-/r/N/A
lower-*.f32N/A
lower-/.f32N/A
lift-PI.f3298.9
Applied rewrites98.9%
Final simplification98.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ (exp (/ PI s)) 1.0))))
(*
(log
(- (/ 1.0 (fma (- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) t_0) u t_0)) 1.0))
(- s))))
float code(float u, float s) {
float t_0 = 1.0f / (expf((((float) M_PI) / s)) + 1.0f);
return logf(((1.0f / fmaf(((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - t_0), u, t_0)) - 1.0f)) * -s;
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))) return Float32(log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - t_0), u, t_0)) - Float32(1.0))) * Float32(-s)) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{e^{\frac{\pi}{s}} + 1}\\
\log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - t\_0, u, t\_0\right)} - 1\right) \cdot \left(-s\right)
\end{array}
\end{array}
Initial program 98.9%
lift-+.f32N/A
lift-*.f32N/A
*-commutativeN/A
lower-fma.f3298.9
Applied rewrites98.9%
Final simplification98.9%
(FPCore (u s)
:precision binary32
(*
(log
(-
(/
1.0
(*
u
(- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) (/ 1.0 (+ (exp (/ PI s)) 1.0)))))
1.0))
(- s)))
float code(float u, float s) {
return logf(((1.0f / (u * ((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - (1.0f / (expf((((float) M_PI) / s)) + 1.0f))))) - 1.0f)) * -s;
}
function code(u, s) return Float32(log(Float32(Float32(Float32(1.0) / Float32(u * Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0)))))) - Float32(1.0))) * Float32(-s)) end
function tmp = code(u, s) tmp = log(((single(1.0) / (u * ((single(1.0) / (exp((-single(pi) / s)) + single(1.0))) - (single(1.0) / (exp((single(pi) / s)) + single(1.0)))))) - single(1.0))) * -s; end
\begin{array}{l}
\\
\log \left(\frac{1}{u \cdot \left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - \frac{1}{e^{\frac{\pi}{s}} + 1}\right)} - 1\right) \cdot \left(-s\right)
\end{array}
Initial program 98.9%
Taylor expanded in u around inf
*-commutativeN/A
lower-*.f32N/A
Applied rewrites97.9%
Final simplification97.9%
(FPCore (u s) :precision binary32 (* (log (fma (/ (fma (* 0.5 PI) u (* -0.25 PI)) s) -4.0 1.0)) (- s)))
float code(float u, float s) {
return logf(fmaf((fmaf((0.5f * ((float) M_PI)), u, (-0.25f * ((float) M_PI))) / s), -4.0f, 1.0f)) * -s;
}
function code(u, s) return Float32(log(fma(Float32(fma(Float32(Float32(0.5) * Float32(pi)), u, Float32(Float32(-0.25) * Float32(pi))) / s), Float32(-4.0), Float32(1.0))) * Float32(-s)) end
\begin{array}{l}
\\
\log \left(\mathsf{fma}\left(\frac{\mathsf{fma}\left(0.5 \cdot \pi, u, -0.25 \cdot \pi\right)}{s}, -4, 1\right)\right) \cdot \left(-s\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Applied rewrites10.3%
Taylor expanded in s around inf
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
Applied rewrites25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* (/ PI s) (/ (* (- s) s) s)))
float code(float u, float s) {
return (((float) M_PI) / s) * ((-s * s) / s);
}
function code(u, s) return Float32(Float32(Float32(pi) / s) * Float32(Float32(Float32(-s) * s) / s)) end
function tmp = code(u, s) tmp = (single(pi) / s) * ((-s * s) / s); end
\begin{array}{l}
\\
\frac{\pi}{s} \cdot \frac{\left(-s\right) \cdot s}{s}
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
lower-/.f32N/A
lower-PI.f3210.7
Applied rewrites10.7%
--rgt-identityN/A
flip--N/A
lift-neg.f32N/A
lift-neg.f32N/A
sqr-negN/A
lift-*.f32N/A
metadata-evalN/A
--rgt-identityN/A
metadata-evalN/A
sub-negN/A
--rgt-identityN/A
lower-/.f3213.3
Applied rewrites13.3%
Final simplification13.3%
(FPCore (u s) :precision binary32 (* (fma 2.0 PI (/ (- PI) u)) u))
float code(float u, float s) {
return fmaf(2.0f, ((float) M_PI), (-((float) M_PI) / u)) * u;
}
function code(u, s) return Float32(fma(Float32(2.0), Float32(pi), Float32(Float32(-Float32(pi)) / u)) * u) end
\begin{array}{l}
\\
\mathsf{fma}\left(2, \pi, \frac{-\pi}{u}\right) \cdot u
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
cancel-sign-sub-invN/A
metadata-evalN/A
distribute-rgt-out--N/A
metadata-evalN/A
associate-*r*N/A
lower-fma.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-PI.f3210.9
Applied rewrites10.9%
Taylor expanded in u around inf
Applied rewrites10.9%
(FPCore (u s) :precision binary32 (* 4.0 (fma (* 0.5 PI) u (* -0.25 PI))))
float code(float u, float s) {
return 4.0f * fmaf((0.5f * ((float) M_PI)), u, (-0.25f * ((float) M_PI)));
}
function code(u, s) return Float32(Float32(4.0) * fma(Float32(Float32(0.5) * Float32(pi)), u, Float32(Float32(-0.25) * Float32(pi)))) end
\begin{array}{l}
\\
4 \cdot \mathsf{fma}\left(0.5 \cdot \pi, u, -0.25 \cdot \pi\right)
\end{array}
Initial program 98.9%
lift-neg.f32N/A
neg-sub0N/A
sub-negN/A
lift-neg.f32N/A
flip3-+N/A
lower-/.f32N/A
metadata-evalN/A
lower-+.f32N/A
lower-pow.f32N/A
metadata-evalN/A
lower-+.f32N/A
lower--.f32N/A
lower-*.f32N/A
lower-*.f3236.9
Applied rewrites36.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
cancel-sign-sub-invN/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f32N/A
distribute-rgt-out--N/A
metadata-evalN/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-PI.f3210.9
Applied rewrites10.9%
Final simplification10.9%
(FPCore (u s) :precision binary32 (* (fma (* u PI) 0.5 (* -0.25 PI)) 4.0))
float code(float u, float s) {
return fmaf((u * ((float) M_PI)), 0.5f, (-0.25f * ((float) M_PI))) * 4.0f;
}
function code(u, s) return Float32(fma(Float32(u * Float32(pi)), Float32(0.5), Float32(Float32(-0.25) * Float32(pi))) * Float32(4.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(u \cdot \pi, 0.5, -0.25 \cdot \pi\right) \cdot 4
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
cancel-sign-sub-invN/A
metadata-evalN/A
distribute-rgt-out--N/A
metadata-evalN/A
associate-*r*N/A
lower-fma.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-PI.f3210.9
Applied rewrites10.9%
(FPCore (u s) :precision binary32 (* (fma 2.0 u -1.0) PI))
float code(float u, float s) {
return fmaf(2.0f, u, -1.0f) * ((float) M_PI);
}
function code(u, s) return Float32(fma(Float32(2.0), u, Float32(-1.0)) * Float32(pi)) end
\begin{array}{l}
\\
\mathsf{fma}\left(2, u, -1\right) \cdot \pi
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
cancel-sign-sub-invN/A
metadata-evalN/A
distribute-rgt-out--N/A
metadata-evalN/A
associate-*r*N/A
lower-fma.f32N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
lower-PI.f3210.9
Applied rewrites10.9%
Taylor expanded in u around 0
Applied rewrites10.9%
Final simplification10.9%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-negN/A
lower-neg.f32N/A
lower-PI.f3210.7
Applied rewrites10.7%
herbie shell --seed 2024235
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))