
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
(FPCore (x)
:precision binary64
(let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0)))
(+
(fma (cbrt (pow (* PI 0.5) 2.0)) (cbrt (* PI 0.5)) (- t_0))
(fma (- t_1) t_1 t_0))))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = sqrt(t_0);
return fma(cbrt(pow((((double) M_PI) * 0.5), 2.0)), cbrt((((double) M_PI) * 0.5)), -t_0) + fma(-t_1, t_1, t_0);
}
function code(x) t_0 = asin(Float64(1.0 - x)) t_1 = sqrt(t_0) return Float64(fma(cbrt((Float64(pi * 0.5) ^ 2.0)), cbrt(Float64(pi * 0.5)), Float64(-t_0)) + fma(Float64(-t_1), t_1, t_0)) end
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[(N[Power[N[Power[N[(Pi * 0.5), $MachinePrecision], 2.0], $MachinePrecision], 1/3], $MachinePrecision] * N[Power[N[(Pi * 0.5), $MachinePrecision], 1/3], $MachinePrecision] + (-t$95$0)), $MachinePrecision] + N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\mathsf{fma}\left(\sqrt[3]{{\left(\pi \cdot 0.5\right)}^{2}}, \sqrt[3]{\pi \cdot 0.5}, -t\_0\right) + \mathsf{fma}\left(-t\_1, t\_1, t\_0\right)
\end{array}
\end{array}
Initial program 5.6%
acos-asin5.6%
*-un-lft-identity5.6%
add-sqr-sqrt9.2%
prod-diff9.2%
add-sqr-sqrt9.3%
fma-neg9.3%
*-un-lft-identity9.3%
acos-asin9.3%
add-sqr-sqrt9.2%
Applied egg-rr9.2%
acos-asin9.2%
add-cube-cbrt3.8%
fma-neg3.8%
cbrt-unprod9.3%
pow29.3%
div-inv9.3%
metadata-eval9.3%
div-inv9.3%
metadata-eval9.3%
Applied egg-rr9.3%
(FPCore (x)
:precision binary64
(let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0)))
(+
(fma (- t_1) t_1 t_0)
(- (* (cbrt (pow (* PI 0.5) 2.0)) (cbrt (* PI 0.5))) t_0))))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = sqrt(t_0);
return fma(-t_1, t_1, t_0) + ((cbrt(pow((((double) M_PI) * 0.5), 2.0)) * cbrt((((double) M_PI) * 0.5))) - t_0);
}
function code(x) t_0 = asin(Float64(1.0 - x)) t_1 = sqrt(t_0) return Float64(fma(Float64(-t_1), t_1, t_0) + Float64(Float64(cbrt((Float64(pi * 0.5) ^ 2.0)) * cbrt(Float64(pi * 0.5))) - t_0)) end
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision] + N[(N[(N[Power[N[Power[N[(Pi * 0.5), $MachinePrecision], 2.0], $MachinePrecision], 1/3], $MachinePrecision] * N[Power[N[(Pi * 0.5), $MachinePrecision], 1/3], $MachinePrecision]), $MachinePrecision] - t$95$0), $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\mathsf{fma}\left(-t\_1, t\_1, t\_0\right) + \left(\sqrt[3]{{\left(\pi \cdot 0.5\right)}^{2}} \cdot \sqrt[3]{\pi \cdot 0.5} - t\_0\right)
\end{array}
\end{array}
Initial program 5.6%
acos-asin5.6%
*-un-lft-identity5.6%
add-sqr-sqrt9.2%
prod-diff9.2%
add-sqr-sqrt9.3%
fma-neg9.3%
*-un-lft-identity9.3%
acos-asin9.3%
add-sqr-sqrt9.2%
Applied egg-rr9.2%
acos-asin9.2%
add-cube-cbrt3.8%
*-un-lft-identity3.8%
prod-diff3.8%
cbrt-unprod9.3%
pow29.3%
div-inv9.3%
metadata-eval9.3%
div-inv9.3%
metadata-eval9.3%
Applied egg-rr9.3%
+-commutative9.3%
fma-undefine9.3%
*-rgt-identity9.3%
*-rgt-identity9.3%
+-commutative9.3%
sub-neg9.3%
+-inverses9.3%
fma-undefine9.3%
*-rgt-identity9.3%
associate-+r+9.3%
Simplified9.3%
Final simplification9.3%
(FPCore (x) :precision binary64 (let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0))) (+ (+ 1.0 (+ (fma (- t_1) t_1 t_0) (acos (- 1.0 x)))) -1.0)))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = sqrt(t_0);
return (1.0 + (fma(-t_1, t_1, t_0) + acos((1.0 - x)))) + -1.0;
}
function code(x) t_0 = asin(Float64(1.0 - x)) t_1 = sqrt(t_0) return Float64(Float64(1.0 + Float64(fma(Float64(-t_1), t_1, t_0) + acos(Float64(1.0 - x)))) + -1.0) end
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[(1.0 + N[(N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision] + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\left(1 + \left(\mathsf{fma}\left(-t\_1, t\_1, t\_0\right) + \cos^{-1} \left(1 - x\right)\right)\right) + -1
\end{array}
\end{array}
Initial program 5.6%
expm1-log1p-u5.6%
expm1-undefine5.6%
log1p-undefine5.6%
rem-exp-log5.6%
Applied egg-rr5.6%
acos-asin5.6%
*-un-lft-identity5.6%
add-sqr-sqrt9.2%
prod-diff9.2%
add-sqr-sqrt9.3%
fma-neg9.3%
*-un-lft-identity9.3%
acos-asin9.3%
add-sqr-sqrt9.2%
Applied egg-rr9.2%
Final simplification9.2%
(FPCore (x) :precision binary64 (let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0))) (+ (fma (- t_1) t_1 t_0) (acos (- 1.0 x)))))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = sqrt(t_0);
return fma(-t_1, t_1, t_0) + acos((1.0 - x));
}
function code(x) t_0 = asin(Float64(1.0 - x)) t_1 = sqrt(t_0) return Float64(fma(Float64(-t_1), t_1, t_0) + acos(Float64(1.0 - x))) end
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision] + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\mathsf{fma}\left(-t\_1, t\_1, t\_0\right) + \cos^{-1} \left(1 - x\right)
\end{array}
\end{array}
Initial program 5.6%
acos-asin5.6%
*-un-lft-identity5.6%
add-sqr-sqrt9.2%
prod-diff9.2%
add-sqr-sqrt9.3%
fma-neg9.3%
*-un-lft-identity9.3%
acos-asin9.3%
add-sqr-sqrt9.2%
Applied egg-rr9.2%
Final simplification9.2%
(FPCore (x) :precision binary64 (- (* PI (pow (sqrt 0.5) 2.0)) (asin (- 1.0 x))))
double code(double x) {
return (((double) M_PI) * pow(sqrt(0.5), 2.0)) - asin((1.0 - x));
}
public static double code(double x) {
return (Math.PI * Math.pow(Math.sqrt(0.5), 2.0)) - Math.asin((1.0 - x));
}
def code(x): return (math.pi * math.pow(math.sqrt(0.5), 2.0)) - math.asin((1.0 - x))
function code(x) return Float64(Float64(pi * (sqrt(0.5) ^ 2.0)) - asin(Float64(1.0 - x))) end
function tmp = code(x) tmp = (pi * (sqrt(0.5) ^ 2.0)) - asin((1.0 - x)); end
code[x_] := N[(N[(Pi * N[Power[N[Sqrt[0.5], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision] - N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\pi \cdot {\left(\sqrt{0.5}\right)}^{2} - \sin^{-1} \left(1 - x\right)
\end{array}
Initial program 5.6%
acos-asin5.6%
*-un-lft-identity5.6%
add-sqr-sqrt9.2%
prod-diff9.2%
add-sqr-sqrt9.3%
fma-neg9.3%
*-un-lft-identity9.3%
acos-asin9.3%
add-sqr-sqrt9.2%
Applied egg-rr9.2%
acos-asin9.2%
add-sqr-sqrt9.3%
fma-neg5.6%
div-inv5.6%
metadata-eval5.6%
div-inv5.6%
metadata-eval5.6%
Applied egg-rr5.6%
Taylor expanded in x around 0 9.2%
+-commutative9.2%
mul-1-neg9.2%
sub-neg9.2%
Simplified9.2%
(FPCore (x) :precision binary64 (acos (- x)))
double code(double x) {
return acos(-x);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(-x)
end function
public static double code(double x) {
return Math.acos(-x);
}
def code(x): return math.acos(-x)
function code(x) return acos(Float64(-x)) end
function tmp = code(x) tmp = acos(-x); end
code[x_] := N[ArcCos[(-x)], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(-x\right)
\end{array}
Initial program 5.6%
Taylor expanded in x around inf 6.9%
neg-mul-16.9%
Simplified6.9%
(FPCore (x) :precision binary64 (acos 1.0))
double code(double x) {
return acos(1.0);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(1.0d0)
end function
public static double code(double x) {
return Math.acos(1.0);
}
def code(x): return math.acos(1.0)
function code(x) return acos(1.0) end
function tmp = code(x) tmp = acos(1.0); end
code[x_] := N[ArcCos[1.0], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} 1
\end{array}
Initial program 5.6%
Taylor expanded in x around 0 3.8%
(FPCore (x) :precision binary64 (* 2.0 (asin (sqrt (/ x 2.0)))))
double code(double x) {
return 2.0 * asin(sqrt((x / 2.0)));
}
real(8) function code(x)
real(8), intent (in) :: x
code = 2.0d0 * asin(sqrt((x / 2.0d0)))
end function
public static double code(double x) {
return 2.0 * Math.asin(Math.sqrt((x / 2.0)));
}
def code(x): return 2.0 * math.asin(math.sqrt((x / 2.0)))
function code(x) return Float64(2.0 * asin(sqrt(Float64(x / 2.0)))) end
function tmp = code(x) tmp = 2.0 * asin(sqrt((x / 2.0))); end
code[x_] := N[(2.0 * N[ArcSin[N[Sqrt[N[(x / 2.0), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
2 \cdot \sin^{-1} \left(\sqrt{\frac{x}{2}}\right)
\end{array}
herbie shell --seed 2024111
(FPCore (x)
:name "bug323 (missed optimization)"
:precision binary64
:pre (and (<= 0.0 x) (<= x 0.5))
:alt
(* 2.0 (asin (sqrt (/ x 2.0))))
(acos (- 1.0 x)))