
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
(FPCore (x) :precision binary64 (let* ((t_0 (sqrt (sqrt PI)))) (fma (* t_0 t_0) (* 0.5 (sqrt PI)) (- (fma PI 0.5 (- (acos (- 1.0 x))))))))
double code(double x) {
double t_0 = sqrt(sqrt(((double) M_PI)));
return fma((t_0 * t_0), (0.5 * sqrt(((double) M_PI))), -fma(((double) M_PI), 0.5, -acos((1.0 - x))));
}
function code(x) t_0 = sqrt(sqrt(pi)) return fma(Float64(t_0 * t_0), Float64(0.5 * sqrt(pi)), Float64(-fma(pi, 0.5, Float64(-acos(Float64(1.0 - x)))))) end
code[x_] := Block[{t$95$0 = N[Sqrt[N[Sqrt[Pi], $MachinePrecision]], $MachinePrecision]}, N[(N[(t$95$0 * t$95$0), $MachinePrecision] * N[(0.5 * N[Sqrt[Pi], $MachinePrecision]), $MachinePrecision] + (-N[(Pi * 0.5 + (-N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision])), $MachinePrecision])), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{\sqrt{\pi}}\\
\mathsf{fma}\left(t\_0 \cdot t\_0, 0.5 \cdot \sqrt{\pi}, -\mathsf{fma}\left(\pi, 0.5, -\cos^{-1} \left(1 - x\right)\right)\right)
\end{array}
\end{array}
Initial program 6.8%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
add-sqr-sqrtN/A
associate-*l*N/A
lower-fma.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f645.0
Applied rewrites5.0%
lift-sqrt.f64N/A
pow1/2N/A
sqr-powN/A
lower-*.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f6410.3
Applied rewrites10.3%
lift-asin.f64N/A
asin-acosN/A
lift-acos.f64N/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
*-commutativeN/A
lower-fma.f64N/A
lower-neg.f6410.3
Applied rewrites10.3%
Final simplification10.3%
(FPCore (x) :precision binary64 (let* ((t_0 (sqrt (sqrt PI)))) (fma (* t_0 t_0) (* 0.5 (sqrt PI)) (- (asin (- 1.0 x))))))
double code(double x) {
double t_0 = sqrt(sqrt(((double) M_PI)));
return fma((t_0 * t_0), (0.5 * sqrt(((double) M_PI))), -asin((1.0 - x)));
}
function code(x) t_0 = sqrt(sqrt(pi)) return fma(Float64(t_0 * t_0), Float64(0.5 * sqrt(pi)), Float64(-asin(Float64(1.0 - x)))) end
code[x_] := Block[{t$95$0 = N[Sqrt[N[Sqrt[Pi], $MachinePrecision]], $MachinePrecision]}, N[(N[(t$95$0 * t$95$0), $MachinePrecision] * N[(0.5 * N[Sqrt[Pi], $MachinePrecision]), $MachinePrecision] + (-N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision])), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{\sqrt{\pi}}\\
\mathsf{fma}\left(t\_0 \cdot t\_0, 0.5 \cdot \sqrt{\pi}, -\sin^{-1} \left(1 - x\right)\right)
\end{array}
\end{array}
Initial program 6.8%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
add-sqr-sqrtN/A
associate-*l*N/A
lower-fma.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f645.0
Applied rewrites5.0%
lift-sqrt.f64N/A
pow1/2N/A
sqr-powN/A
lower-*.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f6410.3
Applied rewrites10.3%
Final simplification10.3%
(FPCore (x) :precision binary64 (let* ((t_0 (* 0.5 (sqrt PI)))) (fma (sqrt PI) t_0 (fma t_0 (- (sqrt PI)) (acos (- 1.0 x))))))
double code(double x) {
double t_0 = 0.5 * sqrt(((double) M_PI));
return fma(sqrt(((double) M_PI)), t_0, fma(t_0, -sqrt(((double) M_PI)), acos((1.0 - x))));
}
function code(x) t_0 = Float64(0.5 * sqrt(pi)) return fma(sqrt(pi), t_0, fma(t_0, Float64(-sqrt(pi)), acos(Float64(1.0 - x)))) end
code[x_] := Block[{t$95$0 = N[(0.5 * N[Sqrt[Pi], $MachinePrecision]), $MachinePrecision]}, N[(N[Sqrt[Pi], $MachinePrecision] * t$95$0 + N[(t$95$0 * (-N[Sqrt[Pi], $MachinePrecision]) + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := 0.5 \cdot \sqrt{\pi}\\
\mathsf{fma}\left(\sqrt{\pi}, t\_0, \mathsf{fma}\left(t\_0, -\sqrt{\pi}, \cos^{-1} \left(1 - x\right)\right)\right)
\end{array}
\end{array}
Initial program 6.8%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
add-sqr-sqrtN/A
associate-*l*N/A
lower-fma.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f645.0
Applied rewrites5.0%
lift-asin.f64N/A
asin-acosN/A
lift-acos.f64N/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
rem-square-sqrtN/A
lift-sqrt.f64N/A
lift-sqrt.f64N/A
associate-*r*N/A
*-commutativeN/A
lift-*.f64N/A
lower-fma.f64N/A
lift-*.f64N/A
*-commutativeN/A
lower-*.f64N/A
lower-neg.f6410.2
Applied rewrites10.2%
lift-neg.f64N/A
lift-fma.f64N/A
distribute-neg-inN/A
lift-*.f64N/A
associate-*l*N/A
lift-sqrt.f64N/A
lift-sqrt.f64N/A
rem-square-sqrtN/A
*-commutativeN/A
lift-neg.f64N/A
remove-double-negN/A
Applied rewrites10.2%
Final simplification10.2%
(FPCore (x) :precision binary64 (fma (* 0.5 (sqrt PI)) (- (sqrt PI)) (+ (* 0.5 PI) (acos (- 1.0 x)))))
double code(double x) {
return fma((0.5 * sqrt(((double) M_PI))), -sqrt(((double) M_PI)), ((0.5 * ((double) M_PI)) + acos((1.0 - x))));
}
function code(x) return fma(Float64(0.5 * sqrt(pi)), Float64(-sqrt(pi)), Float64(Float64(0.5 * pi) + acos(Float64(1.0 - x)))) end
code[x_] := N[(N[(0.5 * N[Sqrt[Pi], $MachinePrecision]), $MachinePrecision] * (-N[Sqrt[Pi], $MachinePrecision]) + N[(N[(0.5 * Pi), $MachinePrecision] + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(0.5 \cdot \sqrt{\pi}, -\sqrt{\pi}, 0.5 \cdot \pi + \cos^{-1} \left(1 - x\right)\right)
\end{array}
Initial program 6.8%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
add-sqr-sqrtN/A
associate-*l*N/A
lower-fma.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f645.0
Applied rewrites5.0%
lift-sqrt.f64N/A
pow1/2N/A
sqr-powN/A
lower-*.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
sqrt-pow2N/A
lift-sqrt.f64N/A
pow1/2N/A
lower-sqrt.f6410.3
Applied rewrites10.3%
lift-asin.f64N/A
asin-acosN/A
lift-acos.f64N/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
*-commutativeN/A
lower-fma.f64N/A
lower-neg.f6410.3
Applied rewrites10.3%
lift-*.f64N/A
lift-sqrt.f64N/A
lift-sqrt.f64N/A
rem-square-sqrt5.0
lower-fma.f64N/A
lift-*.f64N/A
associate-*r*N/A
lift-sqrt.f64N/A
lift-sqrt.f64N/A
rem-square-sqrtN/A
+-commutativeN/A
lift-neg.f64N/A
neg-mul-1N/A
Applied rewrites10.2%
Final simplification10.2%
(FPCore (x) :precision binary64 (if (<= (- 1.0 x) 0.9999999999999996) (fma PI 0.5 (fma PI -0.5 (acos (- 1.0 x)))) (fma (/ 2.0 PI) (* 0.25 (* PI PI)) (- (asin 1.0)))))
double code(double x) {
double tmp;
if ((1.0 - x) <= 0.9999999999999996) {
tmp = fma(((double) M_PI), 0.5, fma(((double) M_PI), -0.5, acos((1.0 - x))));
} else {
tmp = fma((2.0 / ((double) M_PI)), (0.25 * (((double) M_PI) * ((double) M_PI))), -asin(1.0));
}
return tmp;
}
function code(x) tmp = 0.0 if (Float64(1.0 - x) <= 0.9999999999999996) tmp = fma(pi, 0.5, fma(pi, -0.5, acos(Float64(1.0 - x)))); else tmp = fma(Float64(2.0 / pi), Float64(0.25 * Float64(pi * pi)), Float64(-asin(1.0))); end return tmp end
code[x_] := If[LessEqual[N[(1.0 - x), $MachinePrecision], 0.9999999999999996], N[(Pi * 0.5 + N[(Pi * -0.5 + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(N[(2.0 / Pi), $MachinePrecision] * N[(0.25 * N[(Pi * Pi), $MachinePrecision]), $MachinePrecision] + (-N[ArcSin[1.0], $MachinePrecision])), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - x \leq 0.9999999999999996:\\
\;\;\;\;\mathsf{fma}\left(\pi, 0.5, \mathsf{fma}\left(\pi, -0.5, \cos^{-1} \left(1 - x\right)\right)\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(\frac{2}{\pi}, 0.25 \cdot \left(\pi \cdot \pi\right), -\sin^{-1} 1\right)\\
\end{array}
\end{array}
if (-.f64 #s(literal 1 binary64) x) < 0.99999999999999956Initial program 61.5%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f6461.4
Applied rewrites61.4%
lift-asin.f64N/A
asin-acosN/A
lift-acos.f64N/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
*-commutativeN/A
lower-fma.f64N/A
lower-neg.f6461.5
Applied rewrites61.5%
lift-neg.f64N/A
lift-fma.f64N/A
distribute-neg-inN/A
distribute-rgt-neg-inN/A
lift-neg.f64N/A
remove-double-negN/A
lower-fma.f64N/A
metadata-eval61.5
Applied rewrites61.5%
if 0.99999999999999956 < (-.f64 #s(literal 1 binary64) x) Initial program 3.9%
Taylor expanded in x around 0
Applied rewrites3.9%
lift-acos.f64N/A
acos-asinN/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
Applied rewrites7.5%
Final simplification10.2%
(FPCore (x) :precision binary64 (fma (/ 2.0 PI) (* 0.25 (* PI PI)) (- (asin (- 1.0 x)))))
double code(double x) {
return fma((2.0 / ((double) M_PI)), (0.25 * (((double) M_PI) * ((double) M_PI))), -asin((1.0 - x)));
}
function code(x) return fma(Float64(2.0 / pi), Float64(0.25 * Float64(pi * pi)), Float64(-asin(Float64(1.0 - x)))) end
code[x_] := N[(N[(2.0 / Pi), $MachinePrecision] * N[(0.25 * N[(Pi * Pi), $MachinePrecision]), $MachinePrecision] + (-N[ArcSin[N[(1.0 - x), $MachinePrecision]], $MachinePrecision])), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\frac{2}{\pi}, 0.25 \cdot \left(\pi \cdot \pi\right), -\sin^{-1} \left(1 - x\right)\right)
\end{array}
Initial program 6.8%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
add-sqr-sqrtN/A
associate-*l*N/A
lower-fma.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f645.0
Applied rewrites5.0%
lift-fma.f64N/A
Applied rewrites10.2%
Final simplification10.2%
(FPCore (x) :precision binary64 (if (<= x 5.5e-17) (acos (- x)) (fma PI 0.5 (fma PI -0.5 (acos (- 1.0 x))))))
double code(double x) {
double tmp;
if (x <= 5.5e-17) {
tmp = acos(-x);
} else {
tmp = fma(((double) M_PI), 0.5, fma(((double) M_PI), -0.5, acos((1.0 - x))));
}
return tmp;
}
function code(x) tmp = 0.0 if (x <= 5.5e-17) tmp = acos(Float64(-x)); else tmp = fma(pi, 0.5, fma(pi, -0.5, acos(Float64(1.0 - x)))); end return tmp end
code[x_] := If[LessEqual[x, 5.5e-17], N[ArcCos[(-x)], $MachinePrecision], N[(Pi * 0.5 + N[(Pi * -0.5 + N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \leq 5.5 \cdot 10^{-17}:\\
\;\;\;\;\cos^{-1} \left(-x\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(\pi, 0.5, \mathsf{fma}\left(\pi, -0.5, \cos^{-1} \left(1 - x\right)\right)\right)\\
\end{array}
\end{array}
if x < 5.50000000000000001e-17Initial program 3.9%
Taylor expanded in x around inf
mul-1-negN/A
lower-neg.f646.5
Applied rewrites6.5%
if 5.50000000000000001e-17 < x Initial program 61.5%
lift-acos.f64N/A
acos-asinN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
lower-PI.f64N/A
metadata-evalN/A
lower-neg.f64N/A
lower-asin.f6461.4
Applied rewrites61.4%
lift-asin.f64N/A
asin-acosN/A
lift-acos.f64N/A
lift-PI.f64N/A
div-invN/A
metadata-evalN/A
*-commutativeN/A
sub-negN/A
*-commutativeN/A
lower-fma.f64N/A
lower-neg.f6461.5
Applied rewrites61.5%
lift-neg.f64N/A
lift-fma.f64N/A
distribute-neg-inN/A
distribute-rgt-neg-inN/A
lift-neg.f64N/A
remove-double-negN/A
lower-fma.f64N/A
metadata-eval61.5
Applied rewrites61.5%
(FPCore (x) :precision binary64 (if (<= x 5.5e-17) (acos (- x)) (acos (- 1.0 x))))
double code(double x) {
double tmp;
if (x <= 5.5e-17) {
tmp = acos(-x);
} else {
tmp = acos((1.0 - x));
}
return tmp;
}
real(8) function code(x)
real(8), intent (in) :: x
real(8) :: tmp
if (x <= 5.5d-17) then
tmp = acos(-x)
else
tmp = acos((1.0d0 - x))
end if
code = tmp
end function
public static double code(double x) {
double tmp;
if (x <= 5.5e-17) {
tmp = Math.acos(-x);
} else {
tmp = Math.acos((1.0 - x));
}
return tmp;
}
def code(x): tmp = 0 if x <= 5.5e-17: tmp = math.acos(-x) else: tmp = math.acos((1.0 - x)) return tmp
function code(x) tmp = 0.0 if (x <= 5.5e-17) tmp = acos(Float64(-x)); else tmp = acos(Float64(1.0 - x)); end return tmp end
function tmp_2 = code(x) tmp = 0.0; if (x <= 5.5e-17) tmp = acos(-x); else tmp = acos((1.0 - x)); end tmp_2 = tmp; end
code[x_] := If[LessEqual[x, 5.5e-17], N[ArcCos[(-x)], $MachinePrecision], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \leq 5.5 \cdot 10^{-17}:\\
\;\;\;\;\cos^{-1} \left(-x\right)\\
\mathbf{else}:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\end{array}
\end{array}
if x < 5.50000000000000001e-17Initial program 3.9%
Taylor expanded in x around inf
mul-1-negN/A
lower-neg.f646.5
Applied rewrites6.5%
if 5.50000000000000001e-17 < x Initial program 61.5%
(FPCore (x) :precision binary64 (acos (- x)))
double code(double x) {
return acos(-x);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(-x)
end function
public static double code(double x) {
return Math.acos(-x);
}
def code(x): return math.acos(-x)
function code(x) return acos(Float64(-x)) end
function tmp = code(x) tmp = acos(-x); end
code[x_] := N[ArcCos[(-x)], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(-x\right)
\end{array}
Initial program 6.8%
Taylor expanded in x around inf
mul-1-negN/A
lower-neg.f646.8
Applied rewrites6.8%
(FPCore (x) :precision binary64 (acos 1.0))
double code(double x) {
return acos(1.0);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(1.0d0)
end function
public static double code(double x) {
return Math.acos(1.0);
}
def code(x): return math.acos(1.0)
function code(x) return acos(1.0) end
function tmp = code(x) tmp = acos(1.0); end
code[x_] := N[ArcCos[1.0], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} 1
\end{array}
Initial program 6.8%
Taylor expanded in x around 0
Applied rewrites3.8%
(FPCore (x) :precision binary64 (* 2.0 (asin (sqrt (/ x 2.0)))))
double code(double x) {
return 2.0 * asin(sqrt((x / 2.0)));
}
real(8) function code(x)
real(8), intent (in) :: x
code = 2.0d0 * asin(sqrt((x / 2.0d0)))
end function
public static double code(double x) {
return 2.0 * Math.asin(Math.sqrt((x / 2.0)));
}
def code(x): return 2.0 * math.asin(math.sqrt((x / 2.0)))
function code(x) return Float64(2.0 * asin(sqrt(Float64(x / 2.0)))) end
function tmp = code(x) tmp = 2.0 * asin(sqrt((x / 2.0))); end
code[x_] := N[(2.0 * N[ArcSin[N[Sqrt[N[(x / 2.0), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
2 \cdot \sin^{-1} \left(\sqrt{\frac{x}{2}}\right)
\end{array}
herbie shell --seed 2024235
(FPCore (x)
:name "bug323 (missed optimization)"
:precision binary64
:pre (and (<= 0.0 x) (<= x 0.5))
:alt
(! :herbie-platform default (* 2 (asin (sqrt (/ x 2)))))
(acos (- 1.0 x)))