
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 20 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ PI s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) t_0)) t_0))
1.0)))))
float code(float u, float s) {
float t_0 = 1.0f / (1.0f + expf((((float) M_PI) / s)));
return -s * logf(((1.0f / ((u * ((1.0f / (1.0f + expf((-((float) M_PI) / s)))) - t_0)) + t_0)) - 1.0f));
}
function code(u, s) t_0 = Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s)))) return Float32(Float32(-s) * log(Float32(Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(-Float32(pi)) / s)))) - t_0)) + t_0)) - Float32(1.0)))) end
function tmp = code(u, s) t_0 = single(1.0) / (single(1.0) + exp((single(pi) / s))); tmp = -s * log(((single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((-single(pi) / s)))) - t_0)) + t_0)) - single(1.0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\pi}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\pi}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s)))
(t_1 (- -1.0 t_0))
(t_2 (+ 1.0 t_0))
(t_3 (+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u t_1))))
(*
s
(log
(/
(fma (/ 1.0 (- (pow t_3 2.0) (pow t_2 -2.0))) (+ t_3 (/ 1.0 t_1)) 1.0)
(+ -1.0 (pow (+ t_3 (/ 1.0 t_2)) -2.0)))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
float t_1 = -1.0f - t_0;
float t_2 = 1.0f + t_0;
float t_3 = (u / (1.0f + expf((((float) M_PI) / -s)))) + (u / t_1);
return s * logf((fmaf((1.0f / (powf(t_3, 2.0f) - powf(t_2, -2.0f))), (t_3 + (1.0f / t_1)), 1.0f) / (-1.0f + powf((t_3 + (1.0f / t_2)), -2.0f))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) t_1 = Float32(Float32(-1.0) - t_0) t_2 = Float32(Float32(1.0) + t_0) t_3 = Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / t_1)) return Float32(s * log(Float32(fma(Float32(Float32(1.0) / Float32((t_3 ^ Float32(2.0)) - (t_2 ^ Float32(-2.0)))), Float32(t_3 + Float32(Float32(1.0) / t_1)), Float32(1.0)) / Float32(Float32(-1.0) + (Float32(t_3 + Float32(Float32(1.0) / t_2)) ^ Float32(-2.0)))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
t_1 := -1 - t\_0\\
t_2 := 1 + t\_0\\
t_3 := \frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{t\_1}\\
s \cdot \log \left(\frac{\mathsf{fma}\left(\frac{1}{{t\_3}^{2} - {t\_2}^{-2}}, t\_3 + \frac{1}{t\_1}, 1\right)}{-1 + {\left(t\_3 + \frac{1}{t\_2}\right)}^{-2}}\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Applied egg-rr99.1%
Applied egg-rr99.1%
Final simplification99.1%
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s)))
(t_1
(+
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u (- -1.0 t_0)))
(/ 1.0 (+ 1.0 t_0)))))
(* s (log (* (/ 1.0 (+ -1.0 (pow t_1 -2.0))) (+ 1.0 (/ 1.0 t_1)))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
float t_1 = ((u / (1.0f + expf((((float) M_PI) / -s)))) + (u / (-1.0f - t_0))) + (1.0f / (1.0f + t_0));
return s * logf(((1.0f / (-1.0f + powf(t_1, -2.0f))) * (1.0f + (1.0f / t_1))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) t_1 = Float32(Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / Float32(Float32(-1.0) - t_0))) + Float32(Float32(1.0) / Float32(Float32(1.0) + t_0))) return Float32(s * log(Float32(Float32(Float32(1.0) / Float32(Float32(-1.0) + (t_1 ^ Float32(-2.0)))) * Float32(Float32(1.0) + Float32(Float32(1.0) / t_1))))) end
function tmp = code(u, s) t_0 = exp((single(pi) / s)); t_1 = ((u / (single(1.0) + exp((single(pi) / -s)))) + (u / (single(-1.0) - t_0))) + (single(1.0) / (single(1.0) + t_0)); tmp = s * log(((single(1.0) / (single(-1.0) + (t_1 ^ single(-2.0)))) * (single(1.0) + (single(1.0) / t_1)))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
t_1 := \left(\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{-1 - t\_0}\right) + \frac{1}{1 + t\_0}\\
s \cdot \log \left(\frac{1}{-1 + {t\_1}^{-2}} \cdot \left(1 + \frac{1}{t\_1}\right)\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Applied egg-rr99.1%
Applied egg-rr99.1%
Final simplification99.1%
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s)))
(t_1
(+
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u (- -1.0 t_0)))
(/ 1.0 (+ 1.0 t_0)))))
(* s (log (/ (+ 1.0 (/ 1.0 t_1)) (+ -1.0 (pow t_1 -2.0)))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
float t_1 = ((u / (1.0f + expf((((float) M_PI) / -s)))) + (u / (-1.0f - t_0))) + (1.0f / (1.0f + t_0));
return s * logf(((1.0f + (1.0f / t_1)) / (-1.0f + powf(t_1, -2.0f))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) t_1 = Float32(Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / Float32(Float32(-1.0) - t_0))) + Float32(Float32(1.0) / Float32(Float32(1.0) + t_0))) return Float32(s * log(Float32(Float32(Float32(1.0) + Float32(Float32(1.0) / t_1)) / Float32(Float32(-1.0) + (t_1 ^ Float32(-2.0)))))) end
function tmp = code(u, s) t_0 = exp((single(pi) / s)); t_1 = ((u / (single(1.0) + exp((single(pi) / -s)))) + (u / (single(-1.0) - t_0))) + (single(1.0) / (single(1.0) + t_0)); tmp = s * log(((single(1.0) + (single(1.0) / t_1)) / (single(-1.0) + (t_1 ^ single(-2.0))))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
t_1 := \left(\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{-1 - t\_0}\right) + \frac{1}{1 + t\_0}\\
s \cdot \log \left(\frac{1 + \frac{1}{t\_1}}{-1 + {t\_1}^{-2}}\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Applied egg-rr99.1%
Final simplification99.1%
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s))))
(*
s
(log
(/
1.0
(+
-1.0
(/
1.0
(+
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ u (- -1.0 t_0)))
(/ 1.0 (+ 1.0 t_0))))))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
return s * logf((1.0f / (-1.0f + (1.0f / (((u / (1.0f + expf((((float) M_PI) / -s)))) + (u / (-1.0f - t_0))) + (1.0f / (1.0f + t_0)))))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) return Float32(s * log(Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(u / Float32(Float32(-1.0) - t_0))) + Float32(Float32(1.0) / Float32(Float32(1.0) + t_0)))))))) end
function tmp = code(u, s) t_0 = exp((single(pi) / s)); tmp = s * log((single(1.0) / (single(-1.0) + (single(1.0) / (((u / (single(1.0) + exp((single(pi) / -s)))) + (u / (single(-1.0) - t_0))) + (single(1.0) / (single(1.0) + t_0))))))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
s \cdot \log \left(\frac{1}{-1 + \frac{1}{\left(\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{u}{-1 - t\_0}\right) + \frac{1}{1 + t\_0}}}\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Applied egg-rr99.1%
Applied egg-rr99.0%
Final simplification99.0%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(fma
(+ (/ 1.0 (- -1.0 (exp (/ PI s)))) (/ 1.0 (+ 1.0 (exp (/ PI (- s))))))
u
(/ 1.0 (+ 1.0 (exp (* PI (/ 1.0 s)))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / fmaf(((1.0f / (-1.0f - expf((((float) M_PI) / s)))) + (1.0f / (1.0f + expf((((float) M_PI) / -s))))), u, (1.0f / (1.0f + expf((((float) M_PI) * (1.0f / s)))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / fma(Float32(Float32(Float32(1.0) / Float32(Float32(-1.0) - exp(Float32(Float32(pi) / s)))) + Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s)))))), u, Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) * Float32(Float32(1.0) / s)))))))))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\mathsf{fma}\left(\frac{1}{-1 - e^{\frac{\pi}{s}}} + \frac{1}{1 + e^{\frac{\pi}{-s}}}, u, \frac{1}{1 + e^{\pi \cdot \frac{1}{s}}}\right)}\right)
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
clear-numN/A
associate-/r/N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Final simplification98.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ PI s))))
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (+ 1.0 t_0)))
(/ u (- -1.0 t_0)))))))))
float code(float u, float s) {
float t_0 = expf((((float) M_PI) / s));
return -s * logf((-1.0f + (1.0f / (((u / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (1.0f + t_0))) + (u / (-1.0f - t_0))))));
}
function code(u, s) t_0 = exp(Float32(Float32(pi) / s)) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + t_0))) + Float32(u / Float32(Float32(-1.0) - t_0))))))) end
function tmp = code(u, s) t_0 = exp((single(pi) / s)); tmp = -s * log((single(-1.0) + (single(1.0) / (((u / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(1.0) + t_0))) + (u / (single(-1.0) - t_0)))))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\pi}{s}}\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\left(\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{1 + t\_0}\right) + \frac{u}{-1 - t\_0}}\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
rem-log-expN/A
*-lft-identityN/A
log-prodN/A
metadata-evalN/A
rem-log-expN/A
flip3-+N/A
/-lowering-/.f32N/A
Applied egg-rr51.5%
Applied egg-rr98.9%
Final simplification98.9%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+ (/ u (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (+ 1.0 (exp (/ PI s))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (1.0f + expf((((float) M_PI) / s))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / s))))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(1.0) + exp((single(pi) / s)))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\frac{u}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{1 + e^{\frac{\pi}{s}}}}\right)
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3294.3
Simplified94.3%
Taylor expanded in s around 0
associate-*r*N/A
*-lowering-*.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
log-lowering-log.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
Simplified98.7%
Final simplification98.7%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(*
u
(+
(/ 1.0 (+ 1.0 (exp (/ PI (- s)))))
(/ 1.0 (+ -1.0 (- -1.0 (/ PI s))))))
(/
1.0
(+
1.0
(+
1.0
(/
(+
PI
(/
(fma 0.16666666666666666 (/ (* PI (* PI PI)) s) (* (* PI PI) 0.5))
s))
s))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f + (-1.0f - (((float) M_PI) / s)))))) + (1.0f / (1.0f + (1.0f + ((((float) M_PI) + (fmaf(0.16666666666666666f, ((((float) M_PI) * (((float) M_PI) * ((float) M_PI))) / s), ((((float) M_PI) * ((float) M_PI)) * 0.5f)) / s)) / s))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(Float32(-1.0) - Float32(Float32(pi) / s)))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) + Float32(Float32(Float32(pi) + Float32(fma(Float32(0.16666666666666666), Float32(Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))) / s), Float32(Float32(Float32(pi) * Float32(pi)) * Float32(0.5))) / s)) / s))))))))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 + \left(-1 - \frac{\pi}{s}\right)}\right) + \frac{1}{1 + \left(1 + \frac{\pi + \frac{\mathsf{fma}\left(0.16666666666666666, \frac{\pi \cdot \left(\pi \cdot \pi\right)}{s}, \left(\pi \cdot \pi\right) \cdot 0.5\right)}{s}}{s}\right)}}\right)
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3294.3
Simplified94.3%
Taylor expanded in s around -inf
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
/-lowering-/.f32N/A
Simplified92.5%
Final simplification92.5%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(*
u
(+
(/ 1.0 (+ 1.0 (exp (/ PI (- s)))))
(/ 1.0 (+ -1.0 (- -1.0 (/ PI s))))))
(/ 1.0 (+ 1.0 (- 1.0 (/ (fma -0.5 (/ (* PI PI) s) (- PI)) s))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f + (-1.0f - (((float) M_PI) / s)))))) + (1.0f / (1.0f + (1.0f - (fmaf(-0.5f, ((((float) M_PI) * ((float) M_PI)) / s), -((float) M_PI)) / s))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(Float32(-1.0) - Float32(Float32(pi) / s)))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) - Float32(fma(Float32(-0.5), Float32(Float32(Float32(pi) * Float32(pi)) / s), Float32(-Float32(pi))) / s))))))))) end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 + \left(-1 - \frac{\pi}{s}\right)}\right) + \frac{1}{1 + \left(1 - \frac{\mathsf{fma}\left(-0.5, \frac{\pi \cdot \pi}{s}, -\pi\right)}{s}\right)}}\right)
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3294.3
Simplified94.3%
Taylor expanded in s around -inf
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
/-lowering-/.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
PI-lowering-PI.f3291.3
Simplified91.3%
Final simplification91.3%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(/ 1.0 (+ 1.0 (+ 1.0 (/ PI s))))
(*
u
(+
(/ 1.0 (+ 1.0 (exp (/ PI (- s)))))
(/ 1.0 (+ -1.0 (- -1.0 (/ PI s))))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((1.0f / (1.0f + (1.0f + (((float) M_PI) / s)))) + (u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f + (-1.0f - (((float) M_PI) / s))))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(Float32(1.0) + Float32(Float32(pi) / s)))) + Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(Float32(-1.0) - Float32(Float32(pi) / s))))))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((single(1.0) / (single(1.0) + (single(1.0) + (single(pi) / s)))) + (u * ((single(1.0) / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(-1.0) + (single(-1.0) - (single(pi) / s)))))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{\frac{1}{1 + \left(1 + \frac{\pi}{s}\right)} + u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 + \left(-1 - \frac{\pi}{s}\right)}\right)}\right)
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3294.3
Simplified94.3%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3285.4
Simplified85.4%
Final simplification85.4%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(* u (+ (/ 1.0 (+ 1.0 1.0)) (/ 1.0 (+ -1.0 (- -1.0 (/ PI s))))))
(/ 1.0 (+ 1.0 (exp (/ 1.0 (/ s PI)))))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + 1.0f)) + (1.0f / (-1.0f + (-1.0f - (((float) M_PI) / s)))))) + (1.0f / (1.0f + expf((1.0f / (s / ((float) M_PI))))))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + Float32(1.0))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(Float32(-1.0) - Float32(Float32(pi) / s)))))) + Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(1.0) / Float32(s / Float32(pi))))))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u * ((single(1.0) / (single(1.0) + single(1.0))) + (single(1.0) / (single(-1.0) + (single(-1.0) - (single(pi) / s)))))) + (single(1.0) / (single(1.0) + exp((single(1.0) / (s / single(pi)))))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + 1} + \frac{1}{-1 + \left(-1 - \frac{\pi}{s}\right)}\right) + \frac{1}{1 + e^{\frac{1}{\frac{s}{\pi}}}}}\right)
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around inf
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3294.3
Simplified94.3%
Taylor expanded in s around inf
Simplified37.6%
Final simplification37.6%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(* u (+ (/ 1.0 (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (+ -1.0 -1.0))))
(/ (* 2.0 (* s s)) (* PI PI))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f + -1.0f)))) + ((2.0f * (s * s)) / (((float) M_PI) * ((float) M_PI)))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(-1.0))))) + Float32(Float32(Float32(2.0) * Float32(s * s)) / Float32(Float32(pi) * Float32(pi)))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(-1.0) + single(-1.0))))) + ((single(2.0) * (s * s)) / (single(pi) * single(pi))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 + -1}\right) + \frac{2 \cdot \left(s \cdot s\right)}{\pi \cdot \pi}}\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Simplified37.6%
Taylor expanded in s around -inf
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
/-lowering-/.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
PI-lowering-PI.f3236.6
Simplified36.6%
Taylor expanded in s around 0
associate-*r/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f3236.5
Simplified36.5%
Final simplification36.5%
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(+
-1.0
(/
1.0
(+
(* u (+ (/ 1.0 (+ 1.0 (exp (/ PI (- s))))) (/ 1.0 (+ -1.0 -1.0))))
(/ 1.0 (+ (/ PI s) 2.0))))))))
float code(float u, float s) {
return -s * logf((-1.0f + (1.0f / ((u * ((1.0f / (1.0f + expf((((float) M_PI) / -s)))) + (1.0f / (-1.0f + -1.0f)))) + (1.0f / ((((float) M_PI) / s) + 2.0f))))));
}
function code(u, s) return Float32(Float32(-s) * log(Float32(Float32(-1.0) + Float32(Float32(1.0) / Float32(Float32(u * Float32(Float32(Float32(1.0) / Float32(Float32(1.0) + exp(Float32(Float32(pi) / Float32(-s))))) + Float32(Float32(1.0) / Float32(Float32(-1.0) + Float32(-1.0))))) + Float32(Float32(1.0) / Float32(Float32(Float32(pi) / s) + Float32(2.0)))))))) end
function tmp = code(u, s) tmp = -s * log((single(-1.0) + (single(1.0) / ((u * ((single(1.0) / (single(1.0) + exp((single(pi) / -s)))) + (single(1.0) / (single(-1.0) + single(-1.0))))) + (single(1.0) / ((single(pi) / s) + single(2.0))))))); end
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(-1 + \frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{\pi}{-s}}} + \frac{1}{-1 + -1}\right) + \frac{1}{\frac{\pi}{s} + 2}}\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Simplified37.6%
Taylor expanded in s around -inf
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
/-lowering-/.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
/-lowering-/.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
PI-lowering-PI.f3236.6
Simplified36.6%
Taylor expanded in s around inf
+-commutativeN/A
+-lowering-+.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3235.9
Simplified35.9%
Final simplification35.9%
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ (* u PI) 3.0)))
(*
(- s)
(fma
1.0
(/
(-
(fma 1.0 t_0 (* (sqrt PI) (* (sqrt PI) -0.3333333333333333)))
(fma
-1.0
t_0
(*
-2.0
(/ (* 3.0 (fma -0.25 (fma u PI (- PI)) (* (* u PI) -0.25))) 1.125))))
s)
0.0))))
float code(float u, float s) {
float t_0 = (u * ((float) M_PI)) / 3.0f;
return -s * fmaf(1.0f, ((fmaf(1.0f, t_0, (sqrtf(((float) M_PI)) * (sqrtf(((float) M_PI)) * -0.3333333333333333f))) - fmaf(-1.0f, t_0, (-2.0f * ((3.0f * fmaf(-0.25f, fmaf(u, ((float) M_PI), -((float) M_PI)), ((u * ((float) M_PI)) * -0.25f))) / 1.125f)))) / s), 0.0f);
}
function code(u, s) t_0 = Float32(Float32(u * Float32(pi)) / Float32(3.0)) return Float32(Float32(-s) * fma(Float32(1.0), Float32(Float32(fma(Float32(1.0), t_0, Float32(sqrt(Float32(pi)) * Float32(sqrt(Float32(pi)) * Float32(-0.3333333333333333)))) - fma(Float32(-1.0), t_0, Float32(Float32(-2.0) * Float32(Float32(Float32(3.0) * fma(Float32(-0.25), fma(u, Float32(pi), Float32(-Float32(pi))), Float32(Float32(u * Float32(pi)) * Float32(-0.25)))) / Float32(1.125))))) / s), Float32(0.0))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{u \cdot \pi}{3}\\
\left(-s\right) \cdot \mathsf{fma}\left(1, \frac{\mathsf{fma}\left(1, t\_0, \sqrt{\pi} \cdot \left(\sqrt{\pi} \cdot -0.3333333333333333\right)\right) - \mathsf{fma}\left(-1, t\_0, -2 \cdot \frac{3 \cdot \mathsf{fma}\left(-0.25, \mathsf{fma}\left(u, \pi, -\pi\right), \left(u \cdot \pi\right) \cdot -0.25\right)}{1.125}\right)}{s}, 0\right)
\end{array}
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Taylor expanded in s around -inf
Simplified11.9%
associate-/l*N/A
add-sqr-sqrtN/A
associate-*l*N/A
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
PI-lowering-PI.f32N/A
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
PI-lowering-PI.f32N/A
metadata-eval11.9
Applied egg-rr11.9%
Final simplification11.9%
(FPCore (u s) :precision binary32 (* (fma u (* PI -0.5) (* PI 0.25)) -4.0))
float code(float u, float s) {
return fmaf(u, (((float) M_PI) * -0.5f), (((float) M_PI) * 0.25f)) * -4.0f;
}
function code(u, s) return Float32(fma(u, Float32(Float32(pi) * Float32(-0.5)), Float32(Float32(pi) * Float32(0.25))) * Float32(-4.0)) end
\begin{array}{l}
\\
\mathsf{fma}\left(u, \pi \cdot -0.5, \pi \cdot 0.25\right) \cdot -4
\end{array}
Initial program 98.9%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3298.9
Applied egg-rr98.9%
Taylor expanded in s around -inf
*-commutativeN/A
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
metadata-evalN/A
accelerator-lowering-fma.f32N/A
distribute-rgt-out--N/A
metadata-evalN/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
PI-lowering-PI.f3211.9
Simplified11.9%
(FPCore (u s) :precision binary32 (* u (- PI (/ PI u))))
float code(float u, float s) {
return u * (((float) M_PI) - (((float) M_PI) / u));
}
function code(u, s) return Float32(u * Float32(Float32(pi) - Float32(Float32(pi) / u))) end
function tmp = code(u, s) tmp = u * (single(pi) - (single(pi) / u)); end
\begin{array}{l}
\\
u \cdot \left(\pi - \frac{\pi}{u}\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Simplified37.6%
Taylor expanded in s around inf
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
associate-*r*N/A
metadata-evalN/A
distribute-rgt-outN/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
accelerator-lowering-fma.f3211.7
Simplified11.7%
Taylor expanded in u around inf
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
PI-lowering-PI.f32N/A
/-lowering-/.f32N/A
PI-lowering-PI.f3211.7
Simplified11.7%
(FPCore (u s) :precision binary32 (* 4.0 (* PI (fma 0.25 u -0.25))))
float code(float u, float s) {
return 4.0f * (((float) M_PI) * fmaf(0.25f, u, -0.25f));
}
function code(u, s) return Float32(Float32(4.0) * Float32(Float32(pi) * fma(Float32(0.25), u, Float32(-0.25)))) end
\begin{array}{l}
\\
4 \cdot \left(\pi \cdot \mathsf{fma}\left(0.25, u, -0.25\right)\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Simplified37.6%
Taylor expanded in s around inf
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
associate-*r*N/A
metadata-evalN/A
distribute-rgt-outN/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
accelerator-lowering-fma.f3211.7
Simplified11.7%
(FPCore (u s) :precision binary32 (fma u PI (- PI)))
float code(float u, float s) {
return fmaf(u, ((float) M_PI), -((float) M_PI));
}
function code(u, s) return fma(u, Float32(pi), Float32(-Float32(pi))) end
\begin{array}{l}
\\
\mathsf{fma}\left(u, \pi, -\pi\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
Simplified37.6%
Taylor expanded in s around inf
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
associate-*r*N/A
metadata-evalN/A
distribute-rgt-outN/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
accelerator-lowering-fma.f3211.7
Simplified11.7%
Taylor expanded in u around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
PI-lowering-PI.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
PI-lowering-PI.f3211.7
Simplified11.7%
(FPCore (u s) :precision binary32 (- PI))
float code(float u, float s) {
return -((float) M_PI);
}
function code(u, s) return Float32(-Float32(pi)) end
function tmp = code(u, s) tmp = -single(pi); end
\begin{array}{l}
\\
-\pi
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-negN/A
neg-lowering-neg.f32N/A
PI-lowering-PI.f3211.7
Simplified11.7%
(FPCore (u s) :precision binary32 0.0)
float code(float u, float s) {
return 0.0f;
}
real(4) function code(u, s)
real(4), intent (in) :: u
real(4), intent (in) :: s
code = 0.0e0
end function
function code(u, s) return Float32(0.0) end
function tmp = code(u, s) tmp = single(0.0); end
\begin{array}{l}
\\
0
\end{array}
Initial program 98.9%
*-commutativeN/A
accelerator-lowering-fma.f32N/A
Applied egg-rr98.9%
Applied egg-rr99.1%
Taylor expanded in s around inf
distribute-rgt-outN/A
metadata-evalN/A
mul0-rgtN/A
metadata-evalN/A
metadata-evalN/A
metadata-evalN/A
distribute-rgt-outN/A
metadata-evalN/A
mul0-rgtN/A
metadata-evalN/A
metadata-evalN/A
metadata-evalN/A
metadata-evalN/A
metadata-evalN/A
Simplified10.2%
mul0-rgt10.2
Applied egg-rr10.2%
herbie shell --seed 2024204
(FPCore (u s)
:name "Sample trimmed logistic on [-pi, pi]"
:precision binary32
:pre (and (and (<= 2.328306437e-10 u) (<= u 1.0)) (and (<= 0.0 s) (<= s 1.0651631)))
(* (- s) (log (- (/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- PI) s)))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) (/ 1.0 (+ 1.0 (exp (/ PI s)))))) 1.0))))