
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ (exp (/ PI s)) 1.0))))
(*
(- s)
(log
(- (/ 1.0 (fma (- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) t_0) u t_0)) 1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (expf((((float) M_PI) / s)) + 1.0f);
return -s * logf(((1.0f / fmaf(((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - t_0), u, t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - t_0), u, t_0)) - Float32(1.0)))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{e^{\frac{\pi}{s}} + 1}\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - t\_0, u, t\_0\right)} - 1\right)
\end{array}
\end{array}
Initial program 98.9%
Applied rewrites98.9%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(fma
(-
(/ 1.0 (+ (exp (/ (- PI) s)) 1.0))
(/ 1.0 (+ 2.0 (fma 0.5 (/ (* PI PI) (* s s)) (/ PI s)))))
u
(/ 1.0 (+ (exp (/ PI s)) 1.0))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / fmaf(((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - (1.0f / (2.0f + fmaf(0.5f, ((((float) M_PI) * ((float) M_PI)) / (s * s)), (((float) M_PI) / s))))), u, (1.0f / (expf((((float) M_PI) / s)) + 1.0f)))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - Float32(Float32(1.0) / Float32(Float32(2.0) + fma(Float32(0.5), Float32(Float32(Float32(pi) * Float32(pi)) / Float32(s * s)), Float32(Float32(pi) / s))))), u, Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))))) - Float32(1.0)))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - \frac{1}{2 + \mathsf{fma}\left(0.5, \frac{\pi \cdot \pi}{s \cdot s}, \frac{\pi}{s}\right)}, u, \frac{1}{e^{\frac{\pi}{s}} + 1}\right)} - 1\right)
\end{array}
Initial program 98.9%
Applied rewrites98.9%
Taylor expanded in s around inf
lower-+.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
lift-PI.f32N/A
lift-PI.f32N/A
unpow2N/A
lower-*.f32N/A
lift-/.f32N/A
lift-PI.f3297.2
Applied rewrites97.2%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(*
(- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) (/ 1.0 (+ (exp (/ PI s)) 1.0)))
u))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / (((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - (1.0f / (expf((((float) M_PI) / s)) + 1.0f))) * u)) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0)))) * u)) - Float32(1.0)))) end
function tmp = code(u, s) tmp = -s * log(((single(1.0) / (((single(1.0) / (exp((-single(pi) / s)) + single(1.0))) - (single(1.0) / (exp((single(pi) / s)) + single(1.0)))) * u)) - single(1.0))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - \frac{1}{e^{\frac{\pi}{s}} + 1}\right) \cdot u} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in u around inf
*-commutativeN/A
lower-*.f32N/A
Applied rewrites97.6%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(+
(* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 2.0 (/ PI s)))))
(/ 1.0 (+ 1.0 (+ 1.0 (fma 0.5 (/ (* PI PI) (* s s)) (/ PI s)))))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - (1.0f / (2.0f + (((float) M_PI) / s))))) + (1.0f / (1.0f + (1.0f + fmaf(0.5f, ((((float) M_PI) * ((float) M_PI)) / (s * s)), (((float) M_PI) / s))))))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - Float32(Float32(1.0) / Float32(Float32(2.0) + Float32(Float32(pi) / s))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) + fma(Float32(0.5), Float32(Float32(Float32(pi) * Float32(pi)) / Float32(s * s)), Float32(Float32(pi) / s))))))) - Float32(1.0)))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - \frac{1}{2 + \frac{\pi}{s}}\right) + \frac{1}{1 + \left(1 + \mathsf{fma}\left(0.5, \frac{\pi \cdot \pi}{s \cdot s}, \frac{\pi}{s}\right)\right)}} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3294.8
Applied rewrites94.8%
Taylor expanded in s around inf
lower-+.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
lift-PI.f32N/A
lift-PI.f32N/A
unpow2N/A
lower-*.f32N/A
lift-/.f32N/A
lift-PI.f3291.9
Applied rewrites91.9%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(+
(* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (/ PI s))))
(/ 1.0 (+ 1.0 (+ 1.0 (/ PI s))))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - (1.0f / (((float) M_PI) / s)))) + (1.0f / (1.0f + (1.0f + (((float) M_PI) / s)))))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - Float32(Float32(1.0) / Float32(Float32(pi) / s)))) + Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) + Float32(Float32(pi) / s)))))) - Float32(1.0)))) end
function tmp = code(u, s) tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - (single(1.0) / (single(pi) / s)))) + (single(1.0) / (single(1.0) + (single(1.0) + (single(pi) / s)))))) - single(1.0))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - \frac{1}{\frac{\pi}{s}}\right) + \frac{1}{1 + \left(1 + \frac{\pi}{s}\right)}} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3294.8
Applied rewrites94.8%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3285.7
Applied rewrites85.7%
Taylor expanded in s around 0
lift-/.f32N/A
lift-PI.f3285.7
Applied rewrites85.7%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(fma
(- 0.5 (/ 1.0 (+ 2.0 (fma 0.5 (/ (* PI PI) (* s s)) (/ PI s)))))
u
(/ 1.0 (+ (exp (/ PI s)) 1.0))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / fmaf((0.5f - (1.0f / (2.0f + fmaf(0.5f, ((((float) M_PI) * ((float) M_PI)) / (s * s)), (((float) M_PI) / s))))), u, (1.0f / (expf((((float) M_PI) / s)) + 1.0f)))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(0.5) - Float32(Float32(1.0) / Float32(Float32(2.0) + fma(Float32(0.5), Float32(Float32(Float32(pi) * Float32(pi)) / Float32(s * s)), Float32(Float32(pi) / s))))), u, Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))))) - Float32(1.0)))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(0.5 - \frac{1}{2 + \mathsf{fma}\left(0.5, \frac{\pi \cdot \pi}{s \cdot s}, \frac{\pi}{s}\right)}, u, \frac{1}{e^{\frac{\pi}{s}} + 1}\right)} - 1\right)
\end{array}
Initial program 98.9%
Applied rewrites98.9%
Taylor expanded in s around inf
Applied rewrites37.6%
Taylor expanded in s around inf
lower-+.f32N/A
lower-fma.f32N/A
lower-/.f32N/A
unpow2N/A
lower-*.f32N/A
lift-PI.f32N/A
lift-PI.f32N/A
unpow2N/A
lower-*.f32N/A
lift-/.f32N/A
lift-PI.f3237.6
Applied rewrites37.6%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(fma (- 0.5 (/ 1.0 (+ 2.0 (/ PI s)))) u (/ 1.0 (+ (exp (/ PI s)) 1.0))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / fmaf((0.5f - (1.0f / (2.0f + (((float) M_PI) / s)))), u, (1.0f / (expf((((float) M_PI) / s)) + 1.0f)))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(0.5) - Float32(Float32(1.0) / Float32(Float32(2.0) + Float32(Float32(pi) / s)))), u, Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))))) - Float32(1.0)))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(0.5 - \frac{1}{2 + \frac{\pi}{s}}, u, \frac{1}{e^{\frac{\pi}{s}} + 1}\right)} - 1\right)
\end{array}
Initial program 98.9%
Applied rewrites98.9%
Taylor expanded in s around inf
Applied rewrites37.6%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3237.6
Applied rewrites37.6%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(+
(* u (- 0.5 (/ 1.0 (+ 2.0 (/ PI s)))))
(/ 1.0 (+ 1.0 (+ 1.0 (/ PI s))))))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / ((u * (0.5f - (1.0f / (2.0f + (((float) M_PI) / s))))) + (1.0f / (1.0f + (1.0f + (((float) M_PI) / s)))))) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(0.5) - Float32(Float32(1.0) / Float32(Float32(2.0) + Float32(Float32(pi) / s))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) + Float32(Float32(pi) / s)))))) - Float32(1.0)))) end
function tmp = code(u, s) tmp = -s * log(((single(1.0) / ((u * (single(0.5) - (single(1.0) / (single(2.0) + (single(pi) / s))))) + (single(1.0) / (single(1.0) + (single(1.0) + (single(pi) / s)))))) - single(1.0))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(0.5 - \frac{1}{2 + \frac{\pi}{s}}\right) + \frac{1}{1 + \left(1 + \frac{\pi}{s}\right)}} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3294.8
Applied rewrites94.8%
Taylor expanded in s around inf
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3285.7
Applied rewrites85.7%
Taylor expanded in s around inf
Applied rewrites36.1%
(FPCore (u s) :precision binary32 (* (- s) (log (+ 1.0 (/ PI s)))))
float code(float u, float s) {
return -s * logf((1.0f + (((float) M_PI) / s)));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(1.0) + Float32(Float32(pi) / s)))) end
function tmp = code(u, s) tmp = -s * log((single(1.0) + (single(pi) / s))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(1 + \frac{\pi}{s}\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.9%
Taylor expanded in u around 0
lower-+.f32N/A
lift-/.f32N/A
lift-PI.f3225.1
Applied rewrites25.1%
(FPCore (u s) :precision binary32 (* (fma (* PI 0.5) u (* -0.25 PI)) 4.0))
float code(float u, float s) {
return fmaf((((float) M_PI) * 0.5f), u, (-0.25f * ((float) M_PI))) * 4.0f;
}
function code(u, s) return Float32(fma(Float32(Float32(pi) * Float32(0.5)), u, Float32(Float32(-0.25) * Float32(pi))) * Float32(4.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(\pi \cdot 0.5, u, -0.25 \cdot \pi\right) \cdot 4
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
Applied rewrites11.6%
(FPCore (u s) :precision binary32 (fma -1.0 PI (* 2.0 (* u PI))))
float code(float u, float s) {
return fmaf(-1.0f, ((float) M_PI), (2.0f * (u * ((float) M_PI))));
}
function code(u, s) return fma(Float32(-1.0), Float32(pi), Float32(Float32(2.0) * Float32(u * Float32(pi)))) end
\begin{array}{l}
\\
\mathsf{fma}\left(-1, \pi, 2 \cdot \left(u \cdot \pi\right)\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
Applied rewrites11.6%
Taylor expanded in u around 0
lower-fma.f32N/A
lift-PI.f32N/A
lower-*.f32N/A
lower-*.f32N/A
lift-PI.f3211.6
Applied rewrites11.6%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-negN/A
lift-neg.f32N/A
lift-PI.f3211.4
Applied rewrites11.4%
herbie shell --seed 2025096
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))