
; Computes acos(1 - x); the :precision property selects binary64 for every operation.
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
! Returns the arc cosine of (1 - x) in real(8) arithmetic.
function code(x) result(angle)
    real(8), intent (in) :: x
    real(8) :: angle
    angle = acos(1.0d0 - x)
end function code
/**
 * Returns the arc cosine of {@code 1 - x}.
 *
 * @param x value subtracted from one before taking the arc cosine
 * @return {@code Math.acos(1.0 - x)}
 */
public static double code(double x) {
    final double cosine = 1.0 - x;
    return Math.acos(cosine);
}
def code(x):
    """Return the arc cosine of ``1 - x`` as computed by ``math.acos``."""
    cosine = 1.0 - x
    return math.acos(cosine)
# Returns acos(1 - x); the difference is converted to Float64 before the call.
function code(x)
    cosine = Float64(1.0 - x)
    return acos(cosine)
end
function tmp = code(x)
    % Returns the arc cosine of (1 - x).
    cosine = 1.0 - x;
    tmp = acos(cosine);
end
(* Evaluates ArcCos[1 - x]; each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Computes acos(1 - x); the :precision property selects binary64 for every operation.
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
! Computes acos(1 - x) using real(8) operands.
function code(x) result(angle)
    real(8), intent (in) :: x
    real(8) :: angle
    angle = acos(1.0d0 - x)
end function code
/**
 * Computes the arc cosine of {@code 1 - x}.
 *
 * @param x value subtracted from one before taking the arc cosine
 * @return {@code Math.acos(1.0 - x)}
 */
public static double code(double x) {
    final double oneMinusX = 1.0 - x;
    return Math.acos(oneMinusX);
}
def code(x):
    """Compute ``math.acos(1 - x)``."""
    one_minus_x = 1.0 - x
    return math.acos(one_minus_x)
# Computes acos(1 - x); the difference is converted to Float64 before the call.
function code(x)
    one_minus_x = Float64(1.0 - x)
    return acos(one_minus_x)
end
function tmp = code(x)
    % Computes acos(1 - x).
    one_minus_x = 1.0 - x;
    tmp = acos(one_minus_x);
end
(* Evaluates ArcCos[1 - x]; each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
; Sum of two fused multiply-adds, with t_0 = asin(1 - x) and t_1 = sqrt(t_0):
;   fma(cbrt((PI * 0.5)^2), cbrt(PI * 0.5), -t_0)  +  fma(-t_1, t_1, t_0)
(FPCore (x)
:precision binary64
(let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0)))
(+
(fma (cbrt (pow (* PI 0.5) 2.0)) (cbrt (* PI 0.5)) (- t_0))
(fma (- t_1) t_1 t_0))))
/*
 * Evaluates fma(cbrt((pi/2)^2), cbrt(pi/2), -a) + fma(-s, s, a),
 * where a = asin(1 - x) and s = sqrt(a).
 */
double code(double x) {
    const double half_pi = ((double) M_PI) * 0.5;
    const double arc = asin(1.0 - x);
    const double root = sqrt(arc);
    const double main_term = fma(cbrt(pow(half_pi, 2.0)), cbrt(half_pi), -arc);
    const double correction = fma(-root, root, arc);
    return main_term + correction;
}
# Evaluates fma(cbrt((pi/2)^2), cbrt(pi/2), -t_0) + fma(-t_1, t_1, t_0),
# where t_0 = asin(1 - x) and t_1 = sqrt(t_0).
# The statements are placed on separate lines; run together on a single line
# without separators they do not parse.
function code(x)
    t_0 = asin(Float64(1.0 - x))
    t_1 = sqrt(t_0)
    return Float64(fma(cbrt((Float64(pi * 0.5) ^ 2.0)), cbrt(Float64(pi * 0.5)), Float64(-t_0)) + fma(Float64(-t_1), t_1, t_0))
end
(* With t0 = ArcSin[1 - x] and t1 = Sqrt[t0], evaluates ((Pi*0.5)^2)^(1/3) * (Pi*0.5)^(1/3) - t0, plus (-t1*t1 + t0); each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[(N[Power[N[Power[N[(Pi * 0.5), $MachinePrecision], 2.0], $MachinePrecision], 1/3], $MachinePrecision] * N[Power[N[(Pi * 0.5), $MachinePrecision], 1/3], $MachinePrecision] + (-t$95$0)), $MachinePrecision] + N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\mathsf{fma}\left(\sqrt[3]{{\left(\pi \cdot 0.5\right)}^{2}}, \sqrt[3]{\pi \cdot 0.5}, -t\_0\right) + \mathsf{fma}\left(-t\_1, t\_1, t\_0\right)
\end{array}
\end{array}
Initial program 7.9%
acos-asin 7.9%
*-un-lft-identity 7.9%
add-sqr-sqrt 11.2%
prod-diff 11.2%
add-sqr-sqrt 11.2%
fma-neg 11.2%
*-un-lft-identity 11.2%
acos-asin 11.2%
add-sqr-sqrt 11.2%
Applied egg-rr 11.2%
acos-asin 11.2%
add-cube-cbrt 6.1%
fma-neg 6.1%
cbrt-unprod 11.2%
pow2 11.2%
div-inv 11.2%
metadata-eval 11.2%
div-inv 11.2%
metadata-eval 11.2%
Applied egg-rr 11.2%
Final simplification 11.2%
; With t_0 = sqrt(asin(1 - x)): acos(1 - x) + fma(-t_0, t_0, t_0^2), all in binary64.
(FPCore (x) :precision binary64 (let* ((t_0 (sqrt (asin (- 1.0 x))))) (+ (acos (- 1.0 x)) (fma (- t_0) t_0 (pow t_0 2.0)))))
double code(double x) {
double t_0 = sqrt(asin((1.0 - x)));
return acos((1.0 - x)) + fma(-t_0, t_0, pow(t_0, 2.0));
}
# Evaluates acos(1 - x) + fma(-t_0, t_0, t_0^2), where t_0 = sqrt(asin(1 - x)).
# The assignment and the return are placed on separate lines; run together on
# a single line without a separator they do not parse.
function code(x)
    t_0 = sqrt(asin(Float64(1.0 - x)))
    return Float64(acos(Float64(1.0 - x)) + fma(Float64(-t_0), t_0, (t_0 ^ 2.0)))
end
(* With t0 = Sqrt[ArcSin[1 - x]], evaluates ArcCos[1 - x] + (-t0*t0 + t0^2); each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := Block[{t$95$0 = N[Sqrt[N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]}, N[(N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision] + N[((-t$95$0) * t$95$0 + N[Power[t$95$0, 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{\sin^{-1} \left(1 - x\right)}\\
\cos^{-1} \left(1 - x\right) + \mathsf{fma}\left(-t\_0, t\_0, {t\_0}^{2}\right)
\end{array}
\end{array}
Initial program 7.9%
acos-asin 7.9%
*-un-lft-identity 7.9%
add-sqr-sqrt 11.2%
prod-diff 11.2%
add-sqr-sqrt 11.2%
fma-neg 11.2%
*-un-lft-identity 11.2%
acos-asin 11.2%
add-sqr-sqrt 11.2%
Applied egg-rr 11.2%
add-sqr-sqrt 11.2%
pow2 11.2%
Applied egg-rr 11.2%
Final simplification 11.2%
; With t_0 = asin(1 - x) and t_1 = sqrt(t_0): fma(-t_1, t_1, t_0) + ((1 + acos(1 - x)) + -1), all in binary64.
(FPCore (x) :precision binary64 (let* ((t_0 (asin (- 1.0 x))) (t_1 (sqrt t_0))) (+ (fma (- t_1) t_1 t_0) (+ (+ 1.0 (acos (- 1.0 x))) -1.0))))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = sqrt(t_0);
return fma(-t_1, t_1, t_0) + ((1.0 + acos((1.0 - x))) + -1.0);
}
# Evaluates fma(-t_1, t_1, t_0) + ((1 + acos(1 - x)) + -1),
# where t_0 = asin(1 - x) and t_1 = sqrt(t_0).
# The statements are placed on separate lines; run together on a single line
# without separators they do not parse.
function code(x)
    t_0 = asin(Float64(1.0 - x))
    t_1 = sqrt(t_0)
    return Float64(fma(Float64(-t_1), t_1, t_0) + Float64(Float64(1.0 + acos(Float64(1.0 - x))) + -1.0))
end
(* With t0 = ArcSin[1 - x] and t1 = Sqrt[t0], evaluates (-t1*t1 + t0) + ((1 + ArcCos[1 - x]) + -1); each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Sqrt[t$95$0], $MachinePrecision]}, N[(N[((-t$95$1) * t$95$1 + t$95$0), $MachinePrecision] + N[(N[(1.0 + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt{t\_0}\\
\mathsf{fma}\left(-t\_1, t\_1, t\_0\right) + \left(\left(1 + \cos^{-1} \left(1 - x\right)\right) + -1\right)
\end{array}
\end{array}
Initial program 7.9%
acos-asin 7.9%
*-un-lft-identity 7.9%
add-sqr-sqrt 11.2%
prod-diff 11.2%
add-sqr-sqrt 11.2%
fma-neg 11.2%
*-un-lft-identity 11.2%
acos-asin 11.2%
add-sqr-sqrt 11.2%
Applied egg-rr 11.2%
expm1-log1p-u 11.2%
expm1-undefine 11.2%
log1p-undefine 11.2%
rem-exp-log 11.2%
Applied egg-rr 11.2%
Final simplification 11.2%
; Computes PI * 0.5 - cbrt(asin(1 - x))^3 in binary64.
(FPCore (x) :precision binary64 (- (* PI 0.5) (pow (cbrt (asin (- 1.0 x))) 3.0)))
/* Evaluates pi/2 - pow(cbrt(asin(1 - x)), 3). */
double code(double x) {
    const double half_pi = ((double) M_PI) * 0.5;
    const double arc_cbrt = cbrt(asin(1.0 - x));
    return half_pi - pow(arc_cbrt, 3.0);
}
/**
 * Evaluates {@code pi/2 - cbrt(asin(1 - x))^3}.
 *
 * @param x value subtracted from one before taking the arc sine
 * @return {@code Math.PI * 0.5} minus the cubed cube root of {@code Math.asin(1.0 - x)}
 */
public static double code(double x) {
    final double halfPi = Math.PI * 0.5;
    final double arcCbrt = Math.cbrt(Math.asin(1.0 - x));
    return halfPi - Math.pow(arcCbrt, 3.0);
}
# Evaluates pi/2 - cbrt(asin(1 - x))^3.
function code(x)
    half_pi = Float64(pi * 0.5)
    arc_cbrt = cbrt(asin(Float64(1.0 - x)))
    return Float64(half_pi - (arc_cbrt ^ 3.0))
end
(* Evaluates Pi*0.5 - (ArcSin[1 - x]^(1/3))^3; each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[(N[(Pi * 0.5), $MachinePrecision] - N[Power[N[Power[N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision], 1/3], $MachinePrecision], 3.0], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\pi \cdot 0.5 - {\left(\sqrt[3]{\sin^{-1} \left(1 - x\right)}\right)}^{3}
\end{array}
Initial program 7.9%
acos-asin 7.9%
sub-neg 7.9%
div-inv 7.9%
metadata-eval 7.9%
Applied egg-rr 7.9%
sub-neg 7.9%
Simplified 7.9%
add-cube-cbrt 11.1%
pow3 11.1%
Applied egg-rr 11.1%
Final simplification 11.1%
; Computes PI * 0.5 - sqrt(asin(1 - x))^2 in binary64.
(FPCore (x) :precision binary64 (- (* PI 0.5) (pow (sqrt (asin (- 1.0 x))) 2.0)))
/* Evaluates pi/2 - pow(sqrt(asin(1 - x)), 2). */
double code(double x) {
    const double half_pi = ((double) M_PI) * 0.5;
    const double arc_sqrt = sqrt(asin(1.0 - x));
    return half_pi - pow(arc_sqrt, 2.0);
}
/**
 * Evaluates {@code pi/2 - sqrt(asin(1 - x))^2}.
 *
 * @param x value subtracted from one before taking the arc sine
 * @return {@code Math.PI * 0.5} minus the squared square root of {@code Math.asin(1.0 - x)}
 */
public static double code(double x) {
    final double halfPi = Math.PI * 0.5;
    final double arcSqrt = Math.sqrt(Math.asin(1.0 - x));
    return halfPi - Math.pow(arcSqrt, 2.0);
}
def code(x):
    """Return ``pi/2 - sqrt(asin(1 - x)) ** 2`` using the ``math`` module."""
    half_pi = math.pi * 0.5
    arc_sqrt = math.sqrt(math.asin(1.0 - x))
    return half_pi - math.pow(arc_sqrt, 2.0)
# Evaluates pi/2 - sqrt(asin(1 - x))^2.
function code(x)
    half_pi = Float64(pi * 0.5)
    arc_sqrt = sqrt(asin(Float64(1.0 - x)))
    return Float64(half_pi - (arc_sqrt ^ 2.0))
end
function tmp = code(x)
    % Evaluates pi/2 - sqrt(asin(1 - x))^2.
    half_pi = pi * 0.5;
    arc_sqrt = sqrt(asin(1.0 - x));
    tmp = half_pi - (arc_sqrt ^ 2.0);
end
(* Evaluates Pi*0.5 - Sqrt[ArcSin[1 - x]]^2; each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[(N[(Pi * 0.5), $MachinePrecision] - N[Power[N[Sqrt[N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\pi \cdot 0.5 - {\left(\sqrt{\sin^{-1} \left(1 - x\right)}\right)}^{2}
\end{array}
Initial program 7.9%
acos-asin 7.9%
sub-neg 7.9%
div-inv 7.9%
metadata-eval 7.9%
Applied egg-rr 7.9%
sub-neg 7.9%
Simplified 7.9%
add-sqr-sqrt 11.2%
pow2 11.2%
Applied egg-rr 11.2%
Final simplification 11.2%
; Branches on (1 - x) <= 1: acos(1 - x) when true, otherwise PI * 0.5 + asin(1 - x).
(FPCore (x) :precision binary64 (if (<= (- 1.0 x) 1.0) (acos (- 1.0 x)) (+ (* PI 0.5) (asin (- 1.0 x)))))
/*
 * Returns acos(1 - x) when (1 - x) <= 1.0; otherwise returns
 * pi/2 + asin(1 - x).
 */
double code(double x) {
    const double arg = 1.0 - x;
    if (arg <= 1.0) {
        return acos(arg);
    }
    return (((double) M_PI) * 0.5) + asin(arg);
}
/**
 * Returns {@code Math.acos(1 - x)} when {@code 1 - x <= 1.0}; otherwise
 * returns {@code Math.PI * 0.5 + Math.asin(1 - x)}.
 *
 * @param x value subtracted from one to form the argument
 * @return the value of the selected branch
 */
public static double code(double x) {
    final double arg = 1.0 - x;
    if (arg <= 1.0) {
        return Math.acos(arg);
    }
    return (Math.PI * 0.5) + Math.asin(arg);
}
def code(x):
    """Return ``acos(1 - x)`` when ``1 - x <= 1.0``, else ``pi/2 + asin(1 - x)``.

    The body is laid out as an indented block; with the ``if``/``else``
    collapsed onto the ``def`` line the function is not valid Python.
    """
    tmp = 0
    if (1.0 - x) <= 1.0:
        tmp = math.acos((1.0 - x))
    else:
        tmp = (math.pi * 0.5) + math.asin((1.0 - x))
    return tmp
# Returns acos(1 - x) when (1 - x) <= 1.0, otherwise pi/2 + asin(1 - x).
# The statements are placed on separate lines; `tmp = 0.0 if ...` and
# `end return tmp` on a single line do not parse.
function code(x)
    tmp = 0.0
    if (Float64(1.0 - x) <= 1.0)
        tmp = acos(Float64(1.0 - x))
    else
        tmp = Float64(Float64(pi * 0.5) + asin(Float64(1.0 - x)))
    end
    return tmp
end
function tmp_2 = code(x)
    % Returns acos(1 - x) when (1 - x) <= 1.0, otherwise pi/2 + asin(1 - x).
    result = 0.0;
    if ((1.0 - x) <= 1.0)
        result = acos((1.0 - x));
    else
        result = (pi * 0.5) + asin((1.0 - x));
    end
    tmp_2 = result;
end
(* If 1 - x <= 1.0, evaluates ArcCos[1 - x]; otherwise evaluates Pi*0.5 + ArcSin[1 - x]. Each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := If[LessEqual[N[(1.0 - x), $MachinePrecision], 1.0], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision], N[(N[(Pi * 0.5), $MachinePrecision] + N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - x \leq 1:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\mathbf{else}:\\
\;\;\;\;\pi \cdot 0.5 + \sin^{-1} \left(1 - x\right)\\
\end{array}
\end{array}
if (-.f64 #s(literal 1 binary64) x) < 1 Initial program 7.9%
if 1 < (-.f64 #s(literal 1 binary64) x) Initial program 7.9%
acos-asin 7.9%
sub-neg 7.9%
div-inv 7.9%
metadata-eval 7.9%
Applied egg-rr 7.9%
sub-neg 7.9%
Simplified 7.9%
add-sqr-sqrt 11.2%
cancel-sign-sub-inv 11.2%
add-sqr-sqrt 0.0%
sqrt-unprod 7.0%
sqr-neg 7.0%
add-sqr-sqrt 7.0%
add-sqr-sqrt 7.0%
Applied egg-rr 7.0%
Final simplification 7.9%
; Computes acos(1 - x); the :precision property selects binary64 for every operation.
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
! Arc cosine of (1 - x) using real(8) operands.
function code(x) result(angle)
    real(8), intent (in) :: x
    real(8) :: angle
    angle = acos(1.0d0 - x)
end function code
/**
 * Arc cosine of {@code 1 - x}.
 *
 * @param x value subtracted from one before taking the arc cosine
 * @return {@code Math.acos(1.0 - x)}
 */
public static double code(double x) {
    final double operand = 1.0 - x;
    return Math.acos(operand);
}
def code(x):
    """Arc cosine of ``1 - x`` via ``math.acos``."""
    operand = 1.0 - x
    return math.acos(operand)
# Arc cosine of (1 - x); the difference is converted to Float64 before the call.
function code(x)
    operand = Float64(1.0 - x)
    return acos(operand)
end
function tmp = code(x)
    % Arc cosine of (1 - x).
    operand = 1.0 - x;
    tmp = acos(operand);
end
(* Evaluates ArcCos[1 - x]; each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Initial program 7.9%
Final simplification 7.9%
; Computes 2 * asin(sqrt(x / 2)) in binary64.
(FPCore (x) :precision binary64 (* 2.0 (asin (sqrt (/ x 2.0)))))
double code(double x) {
return 2.0 * asin(sqrt((x / 2.0)));
}
! Evaluates 2 * asin(sqrt(x / 2)) using real(8) operands.
function code(x) result(angle)
    real(8), intent (in) :: x
    real(8) :: angle
    angle = 2.0d0 * asin(sqrt(x / 2.0d0))
end function code
/**
 * Evaluates {@code 2 * asin(sqrt(x / 2))}.
 *
 * @param x value halved before taking the square root
 * @return {@code 2.0 * Math.asin(Math.sqrt(x / 2.0))}
 */
public static double code(double x) {
    final double halfRoot = Math.sqrt(x / 2.0);
    return 2.0 * Math.asin(halfRoot);
}
def code(x):
    """Return ``2 * asin(sqrt(x / 2))`` using the ``math`` module."""
    half_root = math.sqrt(x / 2.0)
    return 2.0 * math.asin(half_root)
# Evaluates 2 * asin(sqrt(x / 2)).
function code(x)
    half_root = sqrt(Float64(x / 2.0))
    return Float64(2.0 * asin(half_root))
end
function tmp = code(x)
    % Evaluates 2 * asin(sqrt(x / 2)).
    half_root = sqrt(x / 2.0);
    tmp = 2.0 * asin(half_root);
end
(* Evaluates 2 * ArcSin[Sqrt[x / 2]]; each step is wrapped in N[..., $MachinePrecision]. *)
code[x_] := N[(2.0 * N[ArcSin[N[Sqrt[N[(x / 2.0), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
2 \cdot \sin^{-1} \left(\sqrt{\frac{x}{2}}\right)
\end{array}
herbie shell --seed 2024084
; Benchmark input: the body expression is acos(1 - x) in binary64.
; :pre restricts x to 0 <= x <= 0.5.
; :alt supplies the alternative expression 2 * asin(sqrt(x / 2)).
(FPCore (x)
:name "bug323 (missed optimization)"
:precision binary64
:pre (and (<= 0.0 x) (<= x 0.5))
:alt
(* 2.0 (asin (sqrt (/ x 2.0))))
(acos (- 1.0 x)))