
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
(FPCore (x)
:precision binary64
(let* ((t_0 (asin (- 1.0 x))) (t_1 (cbrt t_0)) (t_2 (pow t_1 2.0)))
(+
(fma
PI
0.5
(* (cbrt (asin (/ (- 1.0 (pow x 3.0)) (+ 1.0 (* x (+ 1.0 x)))))) (- t_2)))
(fma (- t_1) t_2 (cbrt (pow t_0 3.0))))))
double code(double x) {
double t_0 = asin((1.0 - x));
double t_1 = cbrt(t_0);
double t_2 = pow(t_1, 2.0);
return fma(((double) M_PI), 0.5, (cbrt(asin(((1.0 - pow(x, 3.0)) / (1.0 + (x * (1.0 + x)))))) * -t_2)) + fma(-t_1, t_2, cbrt(pow(t_0, 3.0)));
}
function code(x) t_0 = asin(Float64(1.0 - x)) t_1 = cbrt(t_0) t_2 = t_1 ^ 2.0 return Float64(fma(pi, 0.5, Float64(cbrt(asin(Float64(Float64(1.0 - (x ^ 3.0)) / Float64(1.0 + Float64(x * Float64(1.0 + x)))))) * Float64(-t_2))) + fma(Float64(-t_1), t_2, cbrt((t_0 ^ 3.0)))) end
code[x_] := Block[{t$95$0 = N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[Power[t$95$0, 1/3], $MachinePrecision]}, Block[{t$95$2 = N[Power[t$95$1, 2.0], $MachinePrecision]}, N[(N[(Pi * 0.5 + N[(N[Power[N[ArcSin[N[(N[(1.0 - N[Power[x, 3.0], $MachinePrecision]), $MachinePrecision] / N[(1.0 + N[(x * N[(1.0 + x), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], 1/3], $MachinePrecision] * (-t$95$2)), $MachinePrecision]), $MachinePrecision] + N[((-t$95$1) * t$95$2 + N[Power[N[Power[t$95$0, 3.0], $MachinePrecision], 1/3], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sin^{-1} \left(1 - x\right)\\
t_1 := \sqrt[3]{t\_0}\\
t_2 := {t\_1}^{2}\\
\mathsf{fma}\left(\pi, 0.5, \sqrt[3]{\sin^{-1} \left(\frac{1 - {x}^{3}}{1 + x \cdot \left(1 + x\right)}\right)} \cdot \left(-t\_2\right)\right) + \mathsf{fma}\left(-t\_1, t\_2, \sqrt[3]{{t\_0}^{3}}\right)
\end{array}
\end{array}
Initial program 6.8%
acos-asin6.8%
div-inv6.8%
metadata-eval6.8%
add-cube-cbrt10.4%
prod-diff10.4%
pow210.4%
pow210.4%
Applied egg-rr10.4%
flip3--10.5%
div-inv10.5%
metadata-eval10.5%
metadata-eval10.5%
+-commutative10.5%
distribute-rgt-out10.5%
+-commutative10.5%
fma-define10.5%
Applied egg-rr10.5%
associate-*r/10.5%
*-rgt-identity10.5%
Simplified10.5%
unpow210.5%
rem-3cbrt-rft10.5%
add-cbrt-cube10.5%
pow310.5%
Applied egg-rr10.5%
Taylor expanded in x around 0 10.5%
Final simplification10.5%
(FPCore (x)
:precision binary64
(-
(* PI 0.5)
(pow
(cbrt
(cbrt
(*
(asin (/ (- 1.0 (pow x 3.0)) (fma x (+ 1.0 x) 1.0)))
(pow (asin (- 1.0 x)) 2.0))))
3.0)))
double code(double x) {
return (((double) M_PI) * 0.5) - pow(cbrt(cbrt((asin(((1.0 - pow(x, 3.0)) / fma(x, (1.0 + x), 1.0))) * pow(asin((1.0 - x)), 2.0)))), 3.0);
}
function code(x) return Float64(Float64(pi * 0.5) - (cbrt(cbrt(Float64(asin(Float64(Float64(1.0 - (x ^ 3.0)) / fma(x, Float64(1.0 + x), 1.0))) * (asin(Float64(1.0 - x)) ^ 2.0)))) ^ 3.0)) end
code[x_] := N[(N[(Pi * 0.5), $MachinePrecision] - N[Power[N[Power[N[Power[N[(N[ArcSin[N[(N[(1.0 - N[Power[x, 3.0], $MachinePrecision]), $MachinePrecision] / N[(x * N[(1.0 + x), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision]], $MachinePrecision] * N[Power[N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision], 1/3], $MachinePrecision], 1/3], $MachinePrecision], 3.0], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\pi \cdot 0.5 - {\left(\sqrt[3]{\sqrt[3]{\sin^{-1} \left(\frac{1 - {x}^{3}}{\mathsf{fma}\left(x, 1 + x, 1\right)}\right) \cdot {\sin^{-1} \left(1 - x\right)}^{2}}}\right)}^{3}
\end{array}
Initial program 6.8%
acos-asin6.8%
div-inv6.8%
metadata-eval6.8%
add-cube-cbrt10.4%
prod-diff10.4%
pow210.4%
pow210.4%
Applied egg-rr10.4%
flip3--10.5%
div-inv10.5%
metadata-eval10.5%
metadata-eval10.5%
+-commutative10.5%
distribute-rgt-out10.5%
+-commutative10.5%
fma-define10.5%
Applied egg-rr10.5%
associate-*r/10.5%
*-rgt-identity10.5%
Simplified10.5%
Taylor expanded in x around 0 5.1%
Simplified5.1%
cbrt-prod10.5%
unpow210.5%
cbrt-prod10.5%
unpow210.5%
*-commutative10.5%
add-cube-cbrt10.5%
pow310.5%
Applied egg-rr10.5%
Final simplification10.5%
(FPCore (x) :precision binary64 (- (* 0.5 (cbrt (pow PI 3.0))) (asin (- 1.0 x))))
double code(double x) {
return (0.5 * cbrt(pow(((double) M_PI), 3.0))) - asin((1.0 - x));
}
public static double code(double x) {
return (0.5 * Math.cbrt(Math.pow(Math.PI, 3.0))) - Math.asin((1.0 - x));
}
function code(x) return Float64(Float64(0.5 * cbrt((pi ^ 3.0))) - asin(Float64(1.0 - x))) end
code[x_] := N[(N[(0.5 * N[Power[N[Power[Pi, 3.0], $MachinePrecision], 1/3], $MachinePrecision]), $MachinePrecision] - N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
0.5 \cdot \sqrt[3]{{\pi}^{3}} - \sin^{-1} \left(1 - x\right)
\end{array}
Initial program 6.8%
acos-asin6.8%
sub-neg6.8%
div-inv6.8%
metadata-eval6.8%
Applied egg-rr6.8%
sub-neg6.8%
Simplified6.8%
add-cbrt-cube10.4%
pow310.4%
Applied egg-rr10.4%
Final simplification10.4%
(FPCore (x) :precision binary64 (if (<= (- 1.0 x) 1.0) (+ (+ 1.0 (acos (- 1.0 x))) -1.0) (+ (asin (- 1.0 x)) (* PI 0.5))))
double code(double x) {
double tmp;
if ((1.0 - x) <= 1.0) {
tmp = (1.0 + acos((1.0 - x))) + -1.0;
} else {
tmp = asin((1.0 - x)) + (((double) M_PI) * 0.5);
}
return tmp;
}
public static double code(double x) {
double tmp;
if ((1.0 - x) <= 1.0) {
tmp = (1.0 + Math.acos((1.0 - x))) + -1.0;
} else {
tmp = Math.asin((1.0 - x)) + (Math.PI * 0.5);
}
return tmp;
}
def code(x): tmp = 0 if (1.0 - x) <= 1.0: tmp = (1.0 + math.acos((1.0 - x))) + -1.0 else: tmp = math.asin((1.0 - x)) + (math.pi * 0.5) return tmp
function code(x) tmp = 0.0 if (Float64(1.0 - x) <= 1.0) tmp = Float64(Float64(1.0 + acos(Float64(1.0 - x))) + -1.0); else tmp = Float64(asin(Float64(1.0 - x)) + Float64(pi * 0.5)); end return tmp end
function tmp_2 = code(x) tmp = 0.0; if ((1.0 - x) <= 1.0) tmp = (1.0 + acos((1.0 - x))) + -1.0; else tmp = asin((1.0 - x)) + (pi * 0.5); end tmp_2 = tmp; end
code[x_] := If[LessEqual[N[(1.0 - x), $MachinePrecision], 1.0], N[(N[(1.0 + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision] + N[(Pi * 0.5), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - x \leq 1:\\
\;\;\;\;\left(1 + \cos^{-1} \left(1 - x\right)\right) + -1\\
\mathbf{else}:\\
\;\;\;\;\sin^{-1} \left(1 - x\right) + \pi \cdot 0.5\\
\end{array}
\end{array}
if (-.f64 #s(literal 1 binary64) x) < 1Initial program 6.8%
expm1-log1p-u6.8%
expm1-undefine6.9%
log1p-undefine6.9%
rem-exp-log6.9%
Applied egg-rr6.9%
if 1 < (-.f64 #s(literal 1 binary64) x) Initial program 6.8%
acos-asin6.8%
sub-neg6.8%
div-inv6.8%
metadata-eval6.8%
Applied egg-rr6.8%
sub-neg6.8%
Simplified6.8%
sub-neg6.8%
add-sqr-sqrt10.4%
distribute-rgt-neg-out10.4%
add-sqr-sqrt0.0%
sqrt-unprod6.9%
distribute-rgt-neg-out6.9%
add-sqr-sqrt6.9%
distribute-rgt-neg-out6.9%
add-sqr-sqrt6.9%
sqr-neg6.9%
sqrt-unprod6.9%
add-sqr-sqrt6.9%
Applied egg-rr6.9%
Final simplification6.9%
(FPCore (x) :precision binary64 (if (<= (- 1.0 x) 1.0) (acos (- 1.0 x)) (+ (asin (- 1.0 x)) (* PI 0.5))))
double code(double x) {
double tmp;
if ((1.0 - x) <= 1.0) {
tmp = acos((1.0 - x));
} else {
tmp = asin((1.0 - x)) + (((double) M_PI) * 0.5);
}
return tmp;
}
public static double code(double x) {
double tmp;
if ((1.0 - x) <= 1.0) {
tmp = Math.acos((1.0 - x));
} else {
tmp = Math.asin((1.0 - x)) + (Math.PI * 0.5);
}
return tmp;
}
def code(x): tmp = 0 if (1.0 - x) <= 1.0: tmp = math.acos((1.0 - x)) else: tmp = math.asin((1.0 - x)) + (math.pi * 0.5) return tmp
function code(x) tmp = 0.0 if (Float64(1.0 - x) <= 1.0) tmp = acos(Float64(1.0 - x)); else tmp = Float64(asin(Float64(1.0 - x)) + Float64(pi * 0.5)); end return tmp end
function tmp_2 = code(x) tmp = 0.0; if ((1.0 - x) <= 1.0) tmp = acos((1.0 - x)); else tmp = asin((1.0 - x)) + (pi * 0.5); end tmp_2 = tmp; end
code[x_] := If[LessEqual[N[(1.0 - x), $MachinePrecision], 1.0], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision], N[(N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision] + N[(Pi * 0.5), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - x \leq 1:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\mathbf{else}:\\
\;\;\;\;\sin^{-1} \left(1 - x\right) + \pi \cdot 0.5\\
\end{array}
\end{array}
if (-.f64 #s(literal 1 binary64) x) < 1Initial program 6.8%
if 1 < (-.f64 #s(literal 1 binary64) x) Initial program 6.8%
acos-asin6.8%
sub-neg6.8%
div-inv6.8%
metadata-eval6.8%
Applied egg-rr6.8%
sub-neg6.8%
Simplified6.8%
sub-neg6.8%
add-sqr-sqrt10.4%
distribute-rgt-neg-out10.4%
add-sqr-sqrt0.0%
sqrt-unprod6.9%
distribute-rgt-neg-out6.9%
add-sqr-sqrt6.9%
distribute-rgt-neg-out6.9%
add-sqr-sqrt6.9%
sqr-neg6.9%
sqrt-unprod6.9%
add-sqr-sqrt6.9%
Applied egg-rr6.9%
Final simplification6.8%
(FPCore (x) :precision binary64 (acos (* x (+ (/ 1.0 x) -1.0))))
double code(double x) {
return acos((x * ((1.0 / x) + -1.0)));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((x * ((1.0d0 / x) + (-1.0d0))))
end function
public static double code(double x) {
return Math.acos((x * ((1.0 / x) + -1.0)));
}
def code(x): return math.acos((x * ((1.0 / x) + -1.0)))
function code(x) return acos(Float64(x * Float64(Float64(1.0 / x) + -1.0))) end
function tmp = code(x) tmp = acos((x * ((1.0 / x) + -1.0))); end
code[x_] := N[ArcCos[N[(x * N[(N[(1.0 / x), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(x \cdot \left(\frac{1}{x} + -1\right)\right)
\end{array}
Initial program 6.8%
Taylor expanded in x around inf 7.3%
Final simplification7.3%
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Initial program 6.8%
(FPCore (x) :precision binary64 (* 2.0 (asin (sqrt (/ x 2.0)))))
double code(double x) {
return 2.0 * asin(sqrt((x / 2.0)));
}
real(8) function code(x)
real(8), intent (in) :: x
code = 2.0d0 * asin(sqrt((x / 2.0d0)))
end function
public static double code(double x) {
return 2.0 * Math.asin(Math.sqrt((x / 2.0)));
}
def code(x): return 2.0 * math.asin(math.sqrt((x / 2.0)))
function code(x) return Float64(2.0 * asin(sqrt(Float64(x / 2.0)))) end
function tmp = code(x) tmp = 2.0 * asin(sqrt((x / 2.0))); end
code[x_] := N[(2.0 * N[ArcSin[N[Sqrt[N[(x / 2.0), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
2 \cdot \sin^{-1} \left(\sqrt{\frac{x}{2}}\right)
\end{array}
herbie shell --seed 2024179
(FPCore (x)
:name "bug323 (missed optimization)"
:precision binary64
:pre (and (<= 0.0 x) (<= x 0.5))
:alt
(! :herbie-platform default (* 2 (asin (sqrt (/ x 2)))))
(acos (- 1.0 x)))