
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 13 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s)))
(t_1
(fma
u
(+ (/ 1.0 (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (- -1.0 t_0)))
(/ 1.0 (+ 1.0 t_0)))))
(* (- s) (log (/ (+ -1.0 (pow t_1 -2.0)) (- (/ 1.0 t_1) -1.0))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
float t_1 = fmaf(u, ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f - t_0))), (1.0f / (1.0f + t_0)));
return -s * logf(((-1.0f + powf(t_1, -2.0f)) / ((1.0f / t_1) - -1.0f)));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) t_1 = fma(u, Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) - t_0))), Float32(Float32(1.0) / Float32(Float32(1.0) + t_0))) return Float32(Float32(-s) * log(Float32(Float32(Float32(-1.0) + (t_1 ^ Float32(-2.0))) / Float32(Float32(Float32(1.0) / t_1) - Float32(-1.0))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
t_1 := \mathsf{fma}\left(u, \frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 - t\_0}, \frac{1}{1 + t\_0}\right)\\
\left(-s\right) \cdot \log \left(\frac{-1 + {t\_1}^{-2}}{\frac{1}{t\_1} - -1}\right)
\end{array}
\end{array}
Initial program 98.7%
Applied rewrites98.8%
Final simplification98.8%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(*
u
(+ (/ 1.0 (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (- -1.0 (exp (/ PI s))))))
(/ 1.0 (+ 1.0 (exp (* PI (/ 1.0 s)))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f - expf((((float) M_PI) / s)))))) + (1.0f / (1.0f + expf((((float) M_PI) * (1.0f / s)))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) - exp(Float32(Float32(pi) / s)))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) * Float32(Float32(1.0) / s)))))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(-1.0) - exp((single(pi) / s)))))) + (single(1.0) / (single(1.0) + exp((single(pi) * (single(1.0) / s))))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 - e^{\frac{\pi}{s}}}\right) + \frac{1}{1 + e^{\pi \cdot \frac{1}{s}}}}\right)
\end{array}
Initial program 98.7%
lift-PI.f32N/A
clear-numN/A
associate-/r/N/A
lower-*.f32N/A
lower-/.f3298.7
Applied rewrites98.7%
Final simplification98.7%
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s))))
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(/ 1.0 (+ 1.0 t_0))
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u (- -1.0 t_0))))))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
return -s * logf((-1.0f + (1.0f / ((1.0f / (1.0f + t_0)) + ((u / (1.0f + expf((((float) M_PI) / -s)))) + (u / (-1.0f - t_0)))))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + t_0)) + Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / Float32(Float32(-1.0) - t_0)))))))) end
function tmp = code(u, s) t_0 = exp((single(pi) / s)); tmp = -s * log((single(-1.0) + (single(1.0) / ((single(1.0) / (single(1.0) + t_0)) + ((u / (single(1.0) + exp((single(pi) / -s)))) + (u / (single(-1.0) - t_0))))))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\frac{1}{1 + t\_0} + \left(\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{-1 - t\_0}\right)}\right)
\end{array}
\end{array}
Initial program 98.7%
Applied rewrites98.8%
Applied rewrites98.7%
Applied rewrites98.7%
Final simplification98.7%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u (- -1.0 (exp (/ PI s))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u / (1.0f + expf((((float) M_PI) / -s)))) + (u / (-1.0f - expf((((float) M_PI) / s))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / Float32(Float32(-1.0) - exp(Float32(Float32(pi) / s))))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u / (single(1.0) + exp((single(pi) / -s)))) + (u / (single(-1.0) - exp((single(pi) / s)))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{-1 - e^{\frac{\pi}{s}}}}\right)
\end{array}
Initial program 98.7%
Taylor expanded in u around inf
lower-*.f32N/A
sub-negN/A
lower-+.f32N/A
lower-/.f32N/A
lower-+.f32N/A
lower-exp.f32N/A
mul-1-negN/A
distribute-neg-frac2N/A
mul-1-negN/A
lower-/.f32N/A
lower-PI.f32N/A
mul-1-negN/A
lower-neg.f32N/A
distribute-neg-fracN/A
Applied rewrites96.9%
lift-PI.f32N/A
lift-neg.f32N/A
lift-/.f32N/A
lift-exp.f32N/A
lift-+.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-/.f32N/A
lift-exp.f32N/A
lift-+.f32N/A
lift-/.f32N/A
Applied rewrites96.9%
Final simplification96.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (+ s (* s (/ PI s)))))
(*
(- s)
(fma
u
(* -2.0 (+ (/ PI t_0) (/ (* u (* PI PI)) (* t_0 t_0))))
(log1p (/ PI s))))))
float code(float u, float s) {
float t_0 = s + (s * (((float) M_PI) / s));
return -s * fmaf(u, (-2.0f * ((((float) M_PI) / t_0) + ((u * (((float) M_PI) * ((float) M_PI))) / (t_0 * t_0)))), log1pf((((float) M_PI) / s)));
}
function code(u, s) t_0 = Float32(s + Float32(s * Float32(Float32(pi) / s))) return Float32(Float32(-s) * fma(u, Float32(Float32(-2.0) * Float32(Float32(Float32(pi) / t_0) + Float32(Float32(u * Float32(Float32(pi) * Float32(pi))) / Float32(t_0 * t_0)))), log1p(Float32(Float32(pi) / s)))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := s + s \cdot \frac{\pi}{s}\\
\left(-s\right) \cdot \mathsf{fma}\left(u, -2 \cdot \left(\frac{\pi}{t\_0} + \frac{u \cdot \left(\pi \cdot \pi\right)}{t\_0 \cdot t\_0}\right), \mathsf{log1p}\left(\frac{\pi}{s}\right)\right)
\end{array}
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.8%
Taylor expanded in u around 0
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites25.0%
(FPCore (u s)
:precision binary32
(let* ((t_0 (+ 1.0 (/ PI s))))
(fma
u
(* 2.0 (+ (/ PI t_0) (/ (* u (* PI PI)) (* s (* t_0 t_0)))))
(* (- s) (log1p (/ PI s))))))
float code(float u, float s) {
float t_0 = 1.0f + (((float) M_PI) / s);
return fmaf(u, (2.0f * ((((float) M_PI) / t_0) + ((u * (((float) M_PI) * ((float) M_PI))) / (s * (t_0 * t_0))))), (-s * log1pf((((float) M_PI) / s))));
}
function code(u, s) t_0 = Float32(Float32(1.0) + Float32(Float32(pi) / s)) return fma(u, Float32(Float32(2.0) * Float32(Float32(Float32(pi) / t_0) + Float32(Float32(u * Float32(Float32(pi) * Float32(pi))) / Float32(s * Float32(t_0 * t_0))))), Float32(Float32(-s) * log1p(Float32(Float32(pi) / s)))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := 1 + \frac{\pi}{s}\\
\mathsf{fma}\left(u, 2 \cdot \left(\frac{\pi}{t\_0} + \frac{u \cdot \left(\pi \cdot \pi\right)}{s \cdot \left(t\_0 \cdot t\_0\right)}\right), \left(-s\right) \cdot \mathsf{log1p}\left(\frac{\pi}{s}\right)\right)
\end{array}
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.8%
Taylor expanded in u around 0
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites25.0%
(FPCore (u s) :precision binary32 (fma (- s) (log1p (/ PI s)) (/ (* 2.0 (* u PI)) (+ 1.0 (/ PI s)))))
float code(float u, float s) {
return fmaf(-s, log1pf((((float) M_PI) / s)), ((2.0f * (u * ((float) M_PI))) / (1.0f + (((float) M_PI) / s))));
}
function code(u, s) return fma(Float32(-s), log1p(Float32(Float32(pi) / s)), Float32(Float32(Float32(2.0) * Float32(u * Float32(pi))) / Float32(Float32(1.0) + Float32(Float32(pi) / s)))) end
\begin{array}{l}
\\
\mathsf{fma}\left(-s, \mathsf{log1p}\left(\frac{\pi}{s}\right), \frac{2 \cdot \left(u \cdot \pi\right)}{1 + \frac{\pi}{s}}\right)
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.8%
Taylor expanded in u around 0
associate-*r*N/A
lower-fma.f32N/A
mul-1-negN/A
lower-neg.f32N/A
lower-log1p.f32N/A
lower-/.f32N/A
lower-PI.f32N/A
associate-*r/N/A
lower-/.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-PI.f32N/A
lower-+.f32N/A
lower-/.f32N/A
lower-PI.f3225.0
Applied rewrites25.0%
Final simplification25.0%
(FPCore (u s) :precision binary32 (* (- s) (log (+ 1.0 (/ PI s)))))
float code(float u, float s) {
return -s * logf((1.0f + (((float) M_PI) / s)));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(1.0) + Float32(Float32(pi) / s)))) end
function tmp = code(u, s) tmp = -s * log((single(1.0) + (single(pi) / s))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(1 + \frac{\pi}{s}\right)
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.8%
Taylor expanded in u around 0
lower-+.f32N/A
lower-/.f32N/A
lower-PI.f3225.0
Applied rewrites25.0%
(FPCore (u s) :precision binary32 (* (- s) (log1p (/ PI s))))
float code(float u, float s) {
return -s * log1pf((((float) M_PI) / s));
}
function code(u, s) return Float32(Float32(-s) * log1p(Float32(Float32(pi) / s))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \mathsf{log1p}\left(\frac{\pi}{s}\right)
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
+-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.8%
Taylor expanded in u around 0
lower-log1p.f32N/A
lower-/.f32N/A
lower-PI.f3225.0
Applied rewrites25.0%
(FPCore (u s) :precision binary32 (* (fma PI 0.25 (* PI (* u -0.5))) -4.0))
float code(float u, float s) {
return fmaf(((float) M_PI), 0.25f, (((float) M_PI) * (u * -0.5f))) * -4.0f;
}
function code(u, s) return Float32(fma(Float32(pi), Float32(0.25), Float32(Float32(pi) * Float32(u * Float32(-0.5)))) * Float32(-4.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(\pi, 0.25, \pi \cdot \left(u \cdot -0.5\right)\right) \cdot -4
\end{array}
Initial program 98.7%
Taylor expanded in s around -inf
*-commutativeN/A
lower-*.f32N/A
cancel-sign-sub-invN/A
metadata-evalN/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lower-PI.f32N/A
*-commutativeN/A
distribute-rgt-out--N/A
metadata-evalN/A
associate-*l*N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-*.f3212.3
Applied rewrites12.3%
Final simplification12.3%
(FPCore (u s) :precision binary32 (* 4.0 (fma PI (* u 0.5) (* PI -0.25))))
float code(float u, float s) {
return 4.0f * fmaf(((float) M_PI), (u * 0.5f), (((float) M_PI) * -0.25f));
}
function code(u, s) return Float32(Float32(4.0) * fma(Float32(pi), Float32(u * Float32(0.5)), Float32(Float32(pi) * Float32(-0.25)))) end
\begin{array}{l}
\\
4 \cdot \mathsf{fma}\left(\pi, u \cdot 0.5, \pi \cdot -0.25\right)
\end{array}
Initial program 98.7%
Taylor expanded in s around inf
lower-*.f32N/A
cancel-sign-sub-invN/A
*-commutativeN/A
distribute-rgt-out--N/A
metadata-evalN/A
associate-*l*N/A
metadata-evalN/A
lower-fma.f32N/A
lower-PI.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-PI.f3212.3
Applied rewrites12.3%
Final simplification12.3%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.7%
Taylor expanded in u around 0
mul-1-negN/A
lower-neg.f32N/A
lower-PI.f3212.0
Applied rewrites12.0%
(FPCore (u s) :precision binary32 0.0)
float code(float u, float s) {
return 0.0f;
}
real(4) function code(u, s)
real(4), intent (in) :: u
real(4), intent (in) :: s
code = 0.0e0
end function
function code(u, s) return Float32(0.0) end
function tmp = code(u, s) tmp = single(0.0); end
\begin{array}{l}
\\
0
\end{array}
Initial program 98.7%
Applied rewrites98.6%
Taylor expanded in s around inf
associate-*r*N/A
exp-negN/A
rem-exp-logN/A
metadata-evalN/A
metadata-evalN/A
metadata-evalN/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f329.9
Applied rewrites9.9%
lift-neg.f32N/A
mul0-rgt9.9
Applied rewrites9.9%
herbie shell --seed 2024219
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))