
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s)))))
(t_1 (- 1.0 (exp (* -2.0 (/ PI s)))))
(t_2
(fma u (- (/ 1.0 t_1) (+ t_0 (/ (exp (* -1.0 (/ PI s))) t_1))) t_0)))
(*
(- s)
(log
(/
(- (pow t_2 -3.0) 1.0)
(+ 1.0 (/ (fma 1.0 (pow t_2 2.0) (* t_2 1.0)) (pow t_2 3.0))))))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
float t_1 = 1.0f - expf((-2.0f * (((float) M_PI) / s)));
float t_2 = fmaf(u, ((1.0f / t_1) - (t_0 + (expf((-1.0f * (((float) M_PI) / s))) / t_1))), t_0);
return -s * logf(((powf(t_2, -3.0f) - 1.0f) / (1.0f + (fmaf(1.0f, powf(t_2, 2.0f), (t_2 * 1.0f)) / powf(t_2, 3.0f)))));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) t_1 = Float32(Float32(1.0) - exp(Float32(Float32(-2.0) * Float32(Float32(pi) / s)))) t_2 = fma(u, Float32(Float32(Float32(1.0) / t_1) - Float32(t_0 + Float32(exp(Float32(Float32(-1.0) * Float32(Float32(pi) / s))) / t_1))), t_0) return Float32(Float32(-s) * log(Float32(Float32((t_2 ^ Float32(-3.0)) - Float32(1.0)) / Float32(Float32(1.0) + Float32(fma(Float32(1.0), (t_2 ^ Float32(2.0)), Float32(t_2 * Float32(1.0))) / (t_2 ^ Float32(3.0))))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
t_1 := 1 - e^{-2 \cdot \frac{\pi}{s}}\\
t_2 := \mathsf{fma}\left(u, \frac{1}{t\_1} - \left(t\_0 + \frac{e^{-1 \cdot \frac{\pi}{s}}}{t\_1}\right), t\_0\right)\\
\left(-s\right) \cdot \log \left(\frac{{t\_2}^{-3} - 1}{1 + \frac{\mathsf{fma}\left(1, {t\_2}^{2}, t\_2 \cdot 1\right)}{{t\_2}^{3}}}\right)
\end{array}
\end{array}
Initial program 98.9%
lift-+.f32N/A
lift-exp.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-neg.f32N/A
flip-+N/A
lower-/.f32N/A
Applied rewrites98.9%
Applied rewrites98.9%
Taylor expanded in s around 0
Applied rewrites99.0%
Applied rewrites98.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s)))))
(t_1 (- 1.0 (exp (* -2.0 (/ PI s)))))
(t_2
(fma u (- (/ 1.0 t_1) (+ t_0 (/ (exp (* -1.0 (/ PI s))) t_1))) t_0)))
(*
(- s)
(log (/ (- (pow t_2 -3.0) 1.0) (+ 1.0 (+ (/ 1.0 t_2) (pow t_2 -2.0))))))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
float t_1 = 1.0f - expf((-2.0f * (((float) M_PI) / s)));
float t_2 = fmaf(u, ((1.0f / t_1) - (t_0 + (expf((-1.0f * (((float) M_PI) / s))) / t_1))), t_0);
return -s * logf(((powf(t_2, -3.0f) - 1.0f) / (1.0f + ((1.0f / t_2) + powf(t_2, -2.0f)))));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) t_1 = Float32(Float32(1.0) - exp(Float32(Float32(-2.0) * Float32(Float32(pi) / s)))) t_2 = fma(u, Float32(Float32(Float32(1.0) / t_1) - Float32(t_0 + Float32(exp(Float32(Float32(-1.0) * Float32(Float32(pi) / s))) / t_1))), t_0) return Float32(Float32(-s) * log(Float32(Float32((t_2 ^ Float32(-3.0)) - Float32(1.0)) / Float32(Float32(1.0) + Float32(Float32(Float32(1.0) / t_2) + (t_2 ^ Float32(-2.0))))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
t_1 := 1 - e^{-2 \cdot \frac{\pi}{s}}\\
t_2 := \mathsf{fma}\left(u, \frac{1}{t\_1} - \left(t\_0 + \frac{e^{-1 \cdot \frac{\pi}{s}}}{t\_1}\right), t\_0\right)\\
\left(-s\right) \cdot \log \left(\frac{{t\_2}^{-3} - 1}{1 + \left(\frac{1}{t\_2} + {t\_2}^{-2}\right)}\right)
\end{array}
\end{array}
Initial program 98.9%
lift-+.f32N/A
lift-exp.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-neg.f32N/A
flip-+N/A
lower-/.f32N/A
Applied rewrites98.9%
Applied rewrites98.9%
Taylor expanded in s around 0
Applied rewrites99.0%
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/
1.0
(fma
u
(-
(/ (- 1.0 (exp (* -1.0 (/ PI s)))) (- 1.0 (exp (* -2.0 (/ PI s)))))
t_0)
t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / fmaf(u, (((1.0f - expf((-1.0f * (((float) M_PI) / s)))) / (1.0f - expf((-2.0f * (((float) M_PI) / s))))) - t_0), t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(u, Float32(Float32(Float32(Float32(1.0) - exp(Float32(Float32(-1.0) * Float32(Float32(pi) / s)))) / Float32(Float32(1.0) - exp(Float32(Float32(-2.0) * Float32(Float32(pi) / s))))) - t_0), t_0)) - Float32(1.0)))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(u, \frac{1 - e^{-1 \cdot \frac{\pi}{s}}}{1 - e^{-2 \cdot \frac{\pi}{s}}} - t\_0, t\_0\right)} - 1\right)
\end{array}
\end{array}
Initial program 98.9%
lift-+.f32N/A
lift-exp.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-neg.f32N/A
flip-+N/A
lower-/.f32N/A
Applied rewrites98.9%
Applied rewrites98.9%
Taylor expanded in s around 0
lower-/.f32N/A
lower--.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
lift-exp.f32N/A
lift-/.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
lift-exp.f32N/A
lift--.f3298.9
Applied rewrites98.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ (exp (/ PI s)) 1.0))))
(*
(- s)
(log
(- (/ 1.0 (fma (- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) t_0) u t_0)) 1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (expf((((float) M_PI) / s)) + 1.0f);
return -s * logf(((1.0f / fmaf(((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - t_0), u, t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - t_0), u, t_0)) - Float32(1.0)))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{e^{\frac{\pi}{s}} + 1}\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - t\_0, u, t\_0\right)} - 1\right)
\end{array}
\end{array}
Initial program 98.9%
Applied rewrites98.9%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(*
(- (/ 1.0 (+ (exp (/ (- PI) s)) 1.0)) (/ 1.0 (+ (exp (/ PI s)) 1.0)))
u))
1.0))))
float code(float u, float s) {
return -s * logf(((1.0f / (((1.0f / (expf((-((float) M_PI) / s)) + 1.0f)) - (1.0f / (expf((((float) M_PI) / s)) + 1.0f))) * u)) - 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(Float32(Float32(1.0) / Float32(exp(Float32(Float32(-Float32(pi)) / s)) + Float32(1.0))) - Float32(Float32(1.0) / Float32(exp(Float32(Float32(pi) / s)) + Float32(1.0)))) * u)) - Float32(1.0)))) end
function tmp = code(u, s) tmp = -s * log(((single(1.0) / (((single(1.0) / (exp((-single(pi) / s)) + single(1.0))) - (single(1.0) / (exp((single(pi) / s)) + single(1.0)))) * u)) - single(1.0))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\left(\frac{1}{e^{\frac{-\pi}{s}} + 1} - \frac{1}{e^{\frac{\pi}{s}} + 1}\right) \cdot u} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in u around inf
Applied rewrites97.5%
(FPCore (u s) :precision binary32 (* (- s) (log (fma (/ (fma (* PI 0.5) u (* -0.25 PI)) s) -4.0 1.0))))
float code(float u, float s) {
return -s * logf(fmaf((fmaf((((float) M_PI) * 0.5f), u, (-0.25f * ((float) M_PI))) / s), -4.0f, 1.0f));
}
function code(u, s) return Float32(Float32(-s) * log(fma(Float32(fma(Float32(Float32(pi) * Float32(0.5)), u, Float32(Float32(-0.25) * Float32(pi))) / s), Float32(-4.0), Float32(1.0)))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\mathsf{fma}\left(\frac{\mathsf{fma}\left(\pi \cdot 0.5, u, -0.25 \cdot \pi\right)}{s}, -4, 1\right)\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
Applied rewrites24.9%
(FPCore (u s) :precision binary32 (* (- s) (/ s (* u (- (* 0.25 PI) (* -0.25 PI))))))
float code(float u, float s) {
return -s * (s / (u * ((0.25f * ((float) M_PI)) - (-0.25f * ((float) M_PI)))));
}
function code(u, s) return Float32(Float32(-s) * Float32(s / Float32(u * Float32(Float32(Float32(0.25) * Float32(pi)) - Float32(Float32(-0.25) * Float32(pi)))))) end
function tmp = code(u, s) tmp = -s * (s / (u * ((single(0.25) * single(pi)) - (single(-0.25) * single(pi))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \frac{s}{u \cdot \left(0.25 \cdot \pi - -0.25 \cdot \pi\right)}
\end{array}
Initial program 98.9%
Taylor expanded in u around inf
Applied rewrites17.3%
Taylor expanded in s around inf
lower-/.f32N/A
lower-*.f32N/A
lower--.f32N/A
lower-*.f32N/A
lift-PI.f32N/A
lift-*.f32N/A
lift-PI.f3214.5
Applied rewrites14.5%
(FPCore (u s) :precision binary32 (* (fma (* PI 0.5) u (* -0.25 PI)) 4.0))
float code(float u, float s) {
return fmaf((((float) M_PI) * 0.5f), u, (-0.25f * ((float) M_PI))) * 4.0f;
}
function code(u, s) return Float32(fma(Float32(Float32(pi) * Float32(0.5)), u, Float32(Float32(-0.25) * Float32(pi))) * Float32(4.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(\pi \cdot 0.5, u, -0.25 \cdot \pi\right) \cdot 4
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
*-commutativeN/A
lower-*.f32N/A
Applied rewrites11.7%
(FPCore (u s) :precision binary32 (* (- s) (/ PI s)))
float code(float u, float s) {
return -s * (((float) M_PI) / s);
}
function code(u, s) return Float32(Float32(-s) * Float32(Float32(pi) / s)) end
function tmp = code(u, s) tmp = -s * (single(pi) / s); end
\begin{array}{l}
\\
\left(-s\right) \cdot \frac{\pi}{s}
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
lift-/.f32N/A
lift-PI.f3211.5
Applied rewrites11.5%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-negN/A
lift-neg.f32N/A
lift-PI.f3211.5
Applied rewrites11.5%
herbie shell --seed 2025143
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))