
;; Program under analysis, printed with the repeated term bound once:
;;   t_0 = 1 / (1 + exp(PI / s))
;; Value computed from inputs u and s:
;;   (-s) * log(1 / (u * (1 / (1 + exp(-PI / s)) - t_0) + t_0) - 1)
;; :precision binary32 applies to every operation in the body.
;; NOTE: the closing line below is fused with the first token of the LaTeX
;; rendering that follows it in this dump.
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ (PI) s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- (PI)) s)))) t_0)) t_0))
1.0)))))\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\mathsf{PI}\left(\right)}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\mathsf{PI}\left(\right)}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
;; First entry of the alternatives list. No derivation log follows it, and the
;; expression contains no fma or reordered operands:
;;   t_0 = 1 / (1 + exp(PI / s))
;;   (-s) * log(1 / (u * (1 / (1 + exp(-PI / s)) - t_0) + t_0) - 1)
;; All operations are evaluated in binary32.
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ 1.0 (exp (/ (PI) s))))))
(*
(- s)
(log
(-
(/ 1.0 (+ (* u (- (/ 1.0 (+ 1.0 (exp (/ (- (PI)) s)))) t_0)) t_0))
1.0)))))\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{1 + e^{\frac{\mathsf{PI}\left(\right)}{s}}}\\
\left(-s\right) \cdot \log \left(\frac{1}{u \cdot \left(\frac{1}{1 + e^{\frac{-\mathsf{PI}\left(\right)}{s}}} - t\_0\right) + t\_0} - 1\right)
\end{array}
\end{array}
;; Alternative that replaces the final "x - 1" by the quotient
;; (x^2 - 1) / (x + 1), where x = 1 / fma(..., u, t_1); the derivation log
;; that follows lists this step as flip--.
;;   t_0 = exp(PI / s)
;;   t_1 = exp(-log1p(t_0))            ; equals 1 / (1 + t_0) in real arithmetic
;;   t_2 = exp(-log1p(exp(-PI / s)))   ; equals 1 / (1 + exp(-PI / s)) likewise
;; The numerator spells the subtracted term as 1 / (1 + t_0) while the
;; denominator uses t_1; the two are the same real number but are computed by
;; different binary32 operation sequences.
;; The derivation log that follows ends at 99.0%.
(FPCore (u s)
:precision binary32
(let* ((t_0 (exp (/ (PI) s)))
(t_1 (exp (- (log1p t_0))))
(t_2 (exp (- (log1p (exp (/ (- (PI)) s)))))))
(*
(- s)
(log
(/
(- (pow (fma (- t_2 (/ 1.0 (+ 1.0 t_0))) u t_1) -2.0) 1.0)
(+ (/ 1.0 (fma (- t_2 t_1) u t_1)) 1.0))))))\begin{array}{l}
\\
\begin{array}{l}
t_0 := e^{\frac{\mathsf{PI}\left(\right)}{s}}\\
t_1 := e^{-\mathsf{log1p}\left(t\_0\right)}\\
t_2 := e^{-\mathsf{log1p}\left(e^{\frac{-\mathsf{PI}\left(\right)}{s}}\right)}\\
\left(-s\right) \cdot \log \left(\frac{{\left(\mathsf{fma}\left(t\_2 - \frac{1}{1 + t\_0}, u, t\_1\right)\right)}^{-2} - 1}{\frac{1}{\mathsf{fma}\left(t\_2 - t\_1, u, t\_1\right)} + 1}\right)
\end{array}
\end{array}
Initial program 98.9%
lift--.f32 N/A
flip-- N/A
lower-/.f32 N/A
Applied rewrites 99.0%
lift-exp.f32 N/A
lift-neg.f32 N/A
exp-neg N/A
lift-log1p.f32 N/A
rem-exp-log N/A
lower-/.f32 N/A
lower-+.f32 99.0
Applied rewrites 99.0%
;; Alternative that evaluates "difference * u + t_0" with a single fma and
;; writes each sum as exp(...) + 1:
;;   t_0 = 1 / (exp(PI / s) + 1)
;;   (-s) * log(1 / fma(1 / (exp(-PI / s) + 1) - t_0, u, t_0) - 1)
;; The derivation log that follows ends at 98.9%.
(FPCore (u s)
:precision binary32
(let* ((t_0 (/ 1.0 (+ (exp (/ (PI) s)) 1.0))))
(*
(- s)
(log
(-
(/ 1.0 (fma (- (/ 1.0 (+ (exp (/ (- (PI)) s)) 1.0)) t_0) u t_0))
1.0)))))\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{e^{\frac{\mathsf{PI}\left(\right)}{s}} + 1}\\
\left(-s\right) \cdot \log \left(\frac{1}{\mathsf{fma}\left(\frac{1}{e^{\frac{-\mathsf{PI}\left(\right)}{s}} + 1} - t\_0, u, t\_0\right)} - 1\right)
\end{array}
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
*-commutative N/A
lower-fma.f32 N/A
Applied rewrites 98.9%
;; Alternative whose reciprocal argument has no additive 1 / (exp(PI / s) + 1)
;; term, only the product of the difference and u:
;;   (-s) * log(1 / ((1 / (exp(-PI / s) + 1) - 1 / (exp(PI / s) + 1)) * u) - 1)
;; The derivation log that follows attributes this to a Taylor expansion in u
;; around infinity and ends at 97.8%.
(FPCore (u s)
:precision binary32
(*
(- s)
(log
(-
(/
1.0
(*
(- (/ 1.0 (+ (exp (/ (- (PI)) s)) 1.0)) (/ 1.0 (+ (exp (/ (PI) s)) 1.0)))
u))
1.0))))\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{1}{\left(\frac{1}{e^{\frac{-\mathsf{PI}\left(\right)}{s}} + 1} - \frac{1}{e^{\frac{\mathsf{PI}\left(\right)}{s}} + 1}\right) \cdot u} - 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in u around inf
*-commutative N/A
lower-*.f32 N/A
Applied rewrites 97.8%
;; Alternative that does not read u at all: (-s) * log(PI / s + 1).
;; The derivation log that follows ends at 24.7%.
(FPCore (u s) :precision binary32 (* (- s) (log (+ (/ (PI) s) 1.0))))
\begin{array}{l}
\\
\left(-s\right) \cdot \log \left(\frac{\mathsf{PI}\left(\right)}{s} + 1\right)
\end{array}
Initial program 98.9%
Taylor expanded in s around inf
+-commutative N/A
associate-*r/ N/A
*-commutative N/A
associate-/l* N/A
lower-fma.f32 N/A
Applied rewrites 24.3%
Taylor expanded in u around 0
Applied rewrites 24.7%
;; Alternative that does not read s at all:
;;   fma(0.5 * PI, u, -0.25 * PI) * 4   (2*PI*u - PI in real arithmetic).
;; The derivation log that follows ends at 11.6%.
(FPCore (u s) :precision binary32 (* (fma (* 0.5 (PI)) u (* -0.25 (PI))) 4.0))
\begin{array}{l}
\\
\mathsf{fma}\left(0.5 \cdot \mathsf{PI}\left(\right), u, -0.25 \cdot \mathsf{PI}\left(\right)\right) \cdot 4
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-neg N/A
lower-neg.f32 N/A
lower-PI.f32 11.3
Applied rewrites 11.3%
Taylor expanded in s around inf
*-commutative N/A
lower-*.f32 N/A
fp-cancel-sub-sign-inv N/A
*-commutative N/A
distribute-rgt-out-- N/A
metadata-eval N/A
*-commutative N/A
metadata-eval N/A
lower-fma.f32 N/A
lower-*.f32 N/A
lower-PI.f32 N/A
lower-*.f32 N/A
lower-PI.f32 11.6
Applied rewrites 11.6%
;; Constant alternative: returns -PI and reads neither u nor s.
;; The derivation log that follows ends at 11.3%.
(FPCore (u s) :precision binary32 (- (PI)))
\begin{array}{l}
\\
-\mathsf{PI}\left(\right)
\end{array}
Initial program 98.9%
Taylor expanded in u around 0
mul-1-neg N/A
lower-neg.f32 N/A
lower-PI.f32 11.3
Applied rewrites 11.3%
herbie shell --seed 2024352
;; Benchmark input: maps u and s to
;;   (-s) * log(1 / (u * (hi - lo) + lo) - 1)
;; where lo = 1 / (1 + exp(PI / s)) and hi = 1 / (1 + exp(-PI / s)).
;; Every operation is evaluated in binary32.
;; NOTE(review): :pre admits s = 0, where (/ (PI) s) divides by zero --
;; confirm that the closed lower bound on s is intended.
(FPCore (u s)
  :name "Sample trimmed logistic on [-pi, pi]"
  :precision binary32
  :pre (and (and (<= 2.328306437e-10 u) (<= u 1.0))
            (and (<= 0.0 s) (<= s 1.0651631)))
  (let* (;; the term that the one-line form spelled out twice
         (lo (/ 1.0 (+ 1.0 (exp (/ (PI) s)))))
         (hi (/ 1.0 (+ 1.0 (exp (/ (- (PI)) s)))))
         ;; u * (hi - lo) + lo, kept as a separate multiply and add
         (mix (+ (* u (- hi lo)) lo)))
    (* (- s)
       (log (- (/ 1.0 mix) 1.0)))))