
(FPCore (u1 u2) :precision binary64 (+ (* (* (/ 1.0 6.0) (pow (* -2.0 (log u1)) 0.5)) (cos (* (* 2.0 PI) u2))) 0.5))
double code(double u1, double u2) {
return (((1.0 / 6.0) * pow((-2.0 * log(u1)), 0.5)) * cos(((2.0 * ((double) M_PI)) * u2))) + 0.5;
}
public static double code(double u1, double u2) {
return (((1.0 / 6.0) * Math.pow((-2.0 * Math.log(u1)), 0.5)) * Math.cos(((2.0 * Math.PI) * u2))) + 0.5;
}
def code(u1, u2): return (((1.0 / 6.0) * math.pow((-2.0 * math.log(u1)), 0.5)) * math.cos(((2.0 * math.pi) * u2))) + 0.5
function code(u1, u2) return Float64(Float64(Float64(Float64(1.0 / 6.0) * (Float64(-2.0 * log(u1)) ^ 0.5)) * cos(Float64(Float64(2.0 * pi) * u2))) + 0.5) end
function tmp = code(u1, u2) tmp = (((1.0 / 6.0) * ((-2.0 * log(u1)) ^ 0.5)) * cos(((2.0 * pi) * u2))) + 0.5; end
code[u1_, u2_] := N[(N[(N[(N[(1.0 / 6.0), $MachinePrecision] * N[Power[N[(-2.0 * N[Log[u1], $MachinePrecision]), $MachinePrecision], 0.5], $MachinePrecision]), $MachinePrecision] * N[Cos[N[(N[(2.0 * Pi), $MachinePrecision] * u2), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + 0.5), $MachinePrecision]
\begin{array}{l}
\\
\left(\frac{1}{6} \cdot {\left(-2 \cdot \log u1\right)}^{0.5}\right) \cdot \cos \left(\left(2 \cdot \pi\right) \cdot u2\right) + 0.5
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (u1 u2) :precision binary64 (+ (* (* (/ 1.0 6.0) (pow (* -2.0 (log u1)) 0.5)) (cos (* (* 2.0 PI) u2))) 0.5))
double code(double u1, double u2) {
return (((1.0 / 6.0) * pow((-2.0 * log(u1)), 0.5)) * cos(((2.0 * ((double) M_PI)) * u2))) + 0.5;
}
public static double code(double u1, double u2) {
return (((1.0 / 6.0) * Math.pow((-2.0 * Math.log(u1)), 0.5)) * Math.cos(((2.0 * Math.PI) * u2))) + 0.5;
}
def code(u1, u2): return (((1.0 / 6.0) * math.pow((-2.0 * math.log(u1)), 0.5)) * math.cos(((2.0 * math.pi) * u2))) + 0.5
function code(u1, u2) return Float64(Float64(Float64(Float64(1.0 / 6.0) * (Float64(-2.0 * log(u1)) ^ 0.5)) * cos(Float64(Float64(2.0 * pi) * u2))) + 0.5) end
function tmp = code(u1, u2) tmp = (((1.0 / 6.0) * ((-2.0 * log(u1)) ^ 0.5)) * cos(((2.0 * pi) * u2))) + 0.5; end
code[u1_, u2_] := N[(N[(N[(N[(1.0 / 6.0), $MachinePrecision] * N[Power[N[(-2.0 * N[Log[u1], $MachinePrecision]), $MachinePrecision], 0.5], $MachinePrecision]), $MachinePrecision] * N[Cos[N[(N[(2.0 * Pi), $MachinePrecision] * u2), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + 0.5), $MachinePrecision]
\begin{array}{l}
\\
\left(\frac{1}{6} \cdot {\left(-2 \cdot \log u1\right)}^{0.5}\right) \cdot \cos \left(\left(2 \cdot \pi\right) \cdot u2\right) + 0.5
\end{array}
(FPCore (u1 u2) :precision binary64 (fma (sqrt (* (log u1) -0.05555555555555555)) (fabs (cos (* 2.0 (* PI u2)))) 0.5))
double code(double u1, double u2) {
return fma(sqrt((log(u1) * -0.05555555555555555)), fabs(cos((2.0 * (((double) M_PI) * u2)))), 0.5);
}
function code(u1, u2) return fma(sqrt(Float64(log(u1) * -0.05555555555555555)), abs(cos(Float64(2.0 * Float64(pi * u2)))), 0.5) end
code[u1_, u2_] := N[(N[Sqrt[N[(N[Log[u1], $MachinePrecision] * -0.05555555555555555), $MachinePrecision]], $MachinePrecision] * N[Abs[N[Cos[N[(2.0 * N[(Pi * u2), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]], $MachinePrecision] + 0.5), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\sqrt{\log u1 \cdot -0.05555555555555555}, \left|\cos \left(2 \cdot \left(\pi \cdot u2\right)\right)\right|, 0.5\right)
\end{array}
Initial program 99.4%
lift-pow.f64N/A
sqr-powN/A
pow2N/A
lower-pow.f64N/A
metadata-evalN/A
metadata-evalN/A
lower-pow.f64N/A
metadata-eval99.1
Applied rewrites99.1%
Applied rewrites99.6%
Applied rewrites99.6%
(FPCore (u1 u2)
:precision binary64
(+
0.5
(pow
(*
(log u1)
(fma (* (* u2 u2) 0.2222222222222222) (* PI PI) -0.05555555555555555))
0.5)))
double code(double u1, double u2) {
return 0.5 + pow((log(u1) * fma(((u2 * u2) * 0.2222222222222222), (((double) M_PI) * ((double) M_PI)), -0.05555555555555555)), 0.5);
}
function code(u1, u2) return Float64(0.5 + (Float64(log(u1) * fma(Float64(Float64(u2 * u2) * 0.2222222222222222), Float64(pi * pi), -0.05555555555555555)) ^ 0.5)) end
code[u1_, u2_] := N[(0.5 + N[Power[N[(N[Log[u1], $MachinePrecision] * N[(N[(N[(u2 * u2), $MachinePrecision] * 0.2222222222222222), $MachinePrecision] * N[(Pi * Pi), $MachinePrecision] + -0.05555555555555555), $MachinePrecision]), $MachinePrecision], 0.5], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
0.5 + {\left(\log u1 \cdot \mathsf{fma}\left(\left(u2 \cdot u2\right) \cdot 0.2222222222222222, \pi \cdot \pi, -0.05555555555555555\right)\right)}^{0.5}
\end{array}
Initial program 99.4%
lift-pow.f64N/A
sqr-powN/A
pow2N/A
lower-pow.f64N/A
metadata-evalN/A
metadata-evalN/A
lower-pow.f64N/A
metadata-eval99.1
Applied rewrites99.1%
Applied rewrites99.6%
Taylor expanded in u2 around 0
+-commutativeN/A
associate-*r*N/A
associate-*r*N/A
distribute-rgt-outN/A
lower-*.f64N/A
lower-log.f64N/A
lower-fma.f64N/A
*-commutativeN/A
lower-*.f64N/A
unpow2N/A
lower-*.f64N/A
unpow2N/A
lower-*.f64N/A
lower-PI.f64N/A
lower-PI.f6498.9
Applied rewrites98.9%
Final simplification98.9%
herbie shell --seed 2024230
(FPCore (u1 u2)
:name "normal distribution"
:precision binary64
:pre (and (and (<= 0.0 u1) (<= u1 1.0)) (and (<= 0.0 u2) (<= u2 1.0)))
(+ (* (* (/ 1.0 6.0) (pow (* -2.0 (log u1)) 0.5)) (cos (* (* 2.0 PI) u2))) 0.5))