
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x) :precision binary64 (acos (- 1.0 x)))
double code(double x) {
return acos((1.0 - x));
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos((1.0d0 - x))
end function
public static double code(double x) {
return Math.acos((1.0 - x));
}
def code(x): return math.acos((1.0 - x))
function code(x) return acos(Float64(1.0 - x)) end
function tmp = code(x) tmp = acos((1.0 - x)); end
code[x_] := N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(1 - x\right)
\end{array}
(FPCore (x)
:precision binary64
(let* ((t_0 (fma PI 0.5 (asin 1.0)))
(t_1 (- (/ (pow (asin 1.0) 2.0) t_0)))
(t_2 (/ (* 0.25 (* PI PI)) t_0))
(t_3 (fma t_1 (- t_1 t_2) (* 0.0625 (pow (/ t_0 (* PI PI)) -2.0)))))
(if (<= x 5.5e-17)
(/
(-
(* (pow t_2 3.0) t_3)
(* t_3 (pow (* t_0 (pow (asin 1.0) -2.0)) -3.0)))
(pow t_3 2.0))
(acos (- 1.0 x)))))
double code(double x) {
double t_0 = fma(((double) M_PI), 0.5, asin(1.0));
double t_1 = -(pow(asin(1.0), 2.0) / t_0);
double t_2 = (0.25 * (((double) M_PI) * ((double) M_PI))) / t_0;
double t_3 = fma(t_1, (t_1 - t_2), (0.0625 * pow((t_0 / (((double) M_PI) * ((double) M_PI))), -2.0)));
double tmp;
if (x <= 5.5e-17) {
tmp = ((pow(t_2, 3.0) * t_3) - (t_3 * pow((t_0 * pow(asin(1.0), -2.0)), -3.0))) / pow(t_3, 2.0);
} else {
tmp = acos((1.0 - x));
}
return tmp;
}
function code(x) t_0 = fma(pi, 0.5, asin(1.0)) t_1 = Float64(-Float64((asin(1.0) ^ 2.0) / t_0)) t_2 = Float64(Float64(0.25 * Float64(pi * pi)) / t_0) t_3 = fma(t_1, Float64(t_1 - t_2), Float64(0.0625 * (Float64(t_0 / Float64(pi * pi)) ^ -2.0))) tmp = 0.0 if (x <= 5.5e-17) tmp = Float64(Float64(Float64((t_2 ^ 3.0) * t_3) - Float64(t_3 * (Float64(t_0 * (asin(1.0) ^ -2.0)) ^ -3.0))) / (t_3 ^ 2.0)); else tmp = acos(Float64(1.0 - x)); end return tmp end
code[x_] := Block[{t$95$0 = N[(Pi * 0.5 + N[ArcSin[1.0], $MachinePrecision]), $MachinePrecision]}, Block[{t$95$1 = (-N[(N[Power[N[ArcSin[1.0], $MachinePrecision], 2.0], $MachinePrecision] / t$95$0), $MachinePrecision])}, Block[{t$95$2 = N[(N[(0.25 * N[(Pi * Pi), $MachinePrecision]), $MachinePrecision] / t$95$0), $MachinePrecision]}, Block[{t$95$3 = N[(t$95$1 * N[(t$95$1 - t$95$2), $MachinePrecision] + N[(0.0625 * N[Power[N[(t$95$0 / N[(Pi * Pi), $MachinePrecision]), $MachinePrecision], -2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]}, If[LessEqual[x, 5.5e-17], N[(N[(N[(N[Power[t$95$2, 3.0], $MachinePrecision] * t$95$3), $MachinePrecision] - N[(t$95$3 * N[Power[N[(t$95$0 * N[Power[N[ArcSin[1.0], $MachinePrecision], -2.0], $MachinePrecision]), $MachinePrecision], -3.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] / N[Power[t$95$3, 2.0], $MachinePrecision]), $MachinePrecision], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]]]]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \mathsf{fma}\left(\pi, 0.5, \sin^{-1} 1\right)\\
t_1 := -\frac{{\sin^{-1} 1}^{2}}{t\_0}\\
t_2 := \frac{0.25 \cdot \left(\pi \cdot \pi\right)}{t\_0}\\
t_3 := \mathsf{fma}\left(t\_1, t\_1 - t\_2, 0.0625 \cdot {\left(\frac{t\_0}{\pi \cdot \pi}\right)}^{-2}\right)\\
\mathbf{if}\;x \leq 5.5 \cdot 10^{-17}:\\
\;\;\;\;\frac{{t\_2}^{3} \cdot t\_3 - t\_3 \cdot {\left(t\_0 \cdot {\sin^{-1} 1}^{-2}\right)}^{-3}}{{t\_3}^{2}}\\
\mathbf{else}:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\end{array}
\end{array}
if x < 5.50000000000000001e-17Initial program 3.8%
Taylor expanded in x around 0
Simplified3.8%
acos-asinN/A
flip--N/A
div-subN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
Applied egg-rr7.8%
Applied egg-rr7.8%
Applied egg-rr7.8%
if 5.50000000000000001e-17 < x Initial program 68.5%
(FPCore (x)
:precision binary64
(let* ((t_0 (acos (- 1.0 x)))
(t_1 (fma PI (* 0.25 PI) (* (asin 1.0) (fma PI 0.5 (asin 1.0))))))
(if (<= t_0 0.0)
(/
(fma (* (* PI (* PI PI)) 0.125) t_1 (* t_1 (- (pow (asin 1.0) 3.0))))
(pow t_1 2.0))
t_0)))
double code(double x) {
double t_0 = acos((1.0 - x));
double t_1 = fma(((double) M_PI), (0.25 * ((double) M_PI)), (asin(1.0) * fma(((double) M_PI), 0.5, asin(1.0))));
double tmp;
if (t_0 <= 0.0) {
tmp = fma(((((double) M_PI) * (((double) M_PI) * ((double) M_PI))) * 0.125), t_1, (t_1 * -pow(asin(1.0), 3.0))) / pow(t_1, 2.0);
} else {
tmp = t_0;
}
return tmp;
}
function code(x) t_0 = acos(Float64(1.0 - x)) t_1 = fma(pi, Float64(0.25 * pi), Float64(asin(1.0) * fma(pi, 0.5, asin(1.0)))) tmp = 0.0 if (t_0 <= 0.0) tmp = Float64(fma(Float64(Float64(pi * Float64(pi * pi)) * 0.125), t_1, Float64(t_1 * Float64(-(asin(1.0) ^ 3.0)))) / (t_1 ^ 2.0)); else tmp = t_0; end return tmp end
code[x_] := Block[{t$95$0 = N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[(Pi * N[(0.25 * Pi), $MachinePrecision] + N[(N[ArcSin[1.0], $MachinePrecision] * N[(Pi * 0.5 + N[ArcSin[1.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]}, If[LessEqual[t$95$0, 0.0], N[(N[(N[(N[(Pi * N[(Pi * Pi), $MachinePrecision]), $MachinePrecision] * 0.125), $MachinePrecision] * t$95$1 + N[(t$95$1 * (-N[Power[N[ArcSin[1.0], $MachinePrecision], 3.0], $MachinePrecision])), $MachinePrecision]), $MachinePrecision] / N[Power[t$95$1, 2.0], $MachinePrecision]), $MachinePrecision], t$95$0]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \cos^{-1} \left(1 - x\right)\\
t_1 := \mathsf{fma}\left(\pi, 0.25 \cdot \pi, \sin^{-1} 1 \cdot \mathsf{fma}\left(\pi, 0.5, \sin^{-1} 1\right)\right)\\
\mathbf{if}\;t\_0 \leq 0:\\
\;\;\;\;\frac{\mathsf{fma}\left(\left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot 0.125, t\_1, t\_1 \cdot \left(-{\sin^{-1} 1}^{3}\right)\right)}{{t\_1}^{2}}\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if (acos.f64 (-.f64 #s(literal 1 binary64) x)) < 0.0Initial program 3.8%
Taylor expanded in x around 0
Simplified3.8%
acos-asinN/A
flip--N/A
div-subN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
Applied egg-rr7.8%
Applied egg-rr7.8%
if 0.0 < (acos.f64 (-.f64 #s(literal 1 binary64) x)) Initial program 68.5%
Final simplification11.6%
(FPCore (x)
:precision binary64
(let* ((t_0 (fma PI 0.5 (asin 1.0))))
(if (<= x 5.5e-17)
(/
(fma (* PI (* 0.25 PI)) t_0 (- (* t_0 (pow (asin 1.0) 2.0))))
(pow t_0 2.0))
(acos (- 1.0 x)))))
double code(double x) {
double t_0 = fma(((double) M_PI), 0.5, asin(1.0));
double tmp;
if (x <= 5.5e-17) {
tmp = fma((((double) M_PI) * (0.25 * ((double) M_PI))), t_0, -(t_0 * pow(asin(1.0), 2.0))) / pow(t_0, 2.0);
} else {
tmp = acos((1.0 - x));
}
return tmp;
}
function code(x) t_0 = fma(pi, 0.5, asin(1.0)) tmp = 0.0 if (x <= 5.5e-17) tmp = Float64(fma(Float64(pi * Float64(0.25 * pi)), t_0, Float64(-Float64(t_0 * (asin(1.0) ^ 2.0)))) / (t_0 ^ 2.0)); else tmp = acos(Float64(1.0 - x)); end return tmp end
code[x_] := Block[{t$95$0 = N[(Pi * 0.5 + N[ArcSin[1.0], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[x, 5.5e-17], N[(N[(N[(Pi * N[(0.25 * Pi), $MachinePrecision]), $MachinePrecision] * t$95$0 + (-N[(t$95$0 * N[Power[N[ArcSin[1.0], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision])), $MachinePrecision] / N[Power[t$95$0, 2.0], $MachinePrecision]), $MachinePrecision], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \mathsf{fma}\left(\pi, 0.5, \sin^{-1} 1\right)\\
\mathbf{if}\;x \leq 5.5 \cdot 10^{-17}:\\
\;\;\;\;\frac{\mathsf{fma}\left(\pi \cdot \left(0.25 \cdot \pi\right), t\_0, -t\_0 \cdot {\sin^{-1} 1}^{2}\right)}{{t\_0}^{2}}\\
\mathbf{else}:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\end{array}
\end{array}
if x < 5.50000000000000001e-17Initial program 3.8%
Taylor expanded in x around 0
Simplified3.8%
acos-asinN/A
flip--N/A
div-subN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
Applied egg-rr7.8%
lift-PI.f64N/A
lift-PI.f64N/A
lift-*.f64N/A
lift-*.f64N/A
lift-PI.f64N/A
lift-asin.f64N/A
lift-fma.f64N/A
associate-*r/N/A
lift-asin.f64N/A
lift-pow.f64N/A
lift-PI.f64N/A
lift-asin.f64N/A
lift-fma.f64N/A
Applied egg-rr7.8%
if 5.50000000000000001e-17 < x Initial program 68.5%
Final simplification11.6%
(FPCore (x)
:precision binary64
(let* ((t_0 (acos (- 1.0 x))) (t_1 (fma PI 0.5 (asin 1.0))))
(if (<= t_0 0.0)
(fma (/ 0.25 t_1) (* PI PI) (- (/ (pow (asin 1.0) 2.0) t_1)))
t_0)))
double code(double x) {
double t_0 = acos((1.0 - x));
double t_1 = fma(((double) M_PI), 0.5, asin(1.0));
double tmp;
if (t_0 <= 0.0) {
tmp = fma((0.25 / t_1), (((double) M_PI) * ((double) M_PI)), -(pow(asin(1.0), 2.0) / t_1));
} else {
tmp = t_0;
}
return tmp;
}
function code(x) t_0 = acos(Float64(1.0 - x)) t_1 = fma(pi, 0.5, asin(1.0)) tmp = 0.0 if (t_0 <= 0.0) tmp = fma(Float64(0.25 / t_1), Float64(pi * pi), Float64(-Float64((asin(1.0) ^ 2.0) / t_1))); else tmp = t_0; end return tmp end
code[x_] := Block[{t$95$0 = N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]}, Block[{t$95$1 = N[(Pi * 0.5 + N[ArcSin[1.0], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[t$95$0, 0.0], N[(N[(0.25 / t$95$1), $MachinePrecision] * N[(Pi * Pi), $MachinePrecision] + (-N[(N[Power[N[ArcSin[1.0], $MachinePrecision], 2.0], $MachinePrecision] / t$95$1), $MachinePrecision])), $MachinePrecision], t$95$0]]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \cos^{-1} \left(1 - x\right)\\
t_1 := \mathsf{fma}\left(\pi, 0.5, \sin^{-1} 1\right)\\
\mathbf{if}\;t\_0 \leq 0:\\
\;\;\;\;\mathsf{fma}\left(\frac{0.25}{t\_1}, \pi \cdot \pi, -\frac{{\sin^{-1} 1}^{2}}{t\_1}\right)\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if (acos.f64 (-.f64 #s(literal 1 binary64) x)) < 0.0Initial program 3.8%
Taylor expanded in x around 0
Simplified3.8%
acos-asinN/A
flip--N/A
div-subN/A
sub-negN/A
div-invN/A
lower-fma.f64N/A
Applied egg-rr7.8%
lift-PI.f64N/A
lift-PI.f64N/A
lift-*.f64N/A
lift-*.f64N/A
lift-PI.f64N/A
lift-asin.f64N/A
lift-fma.f64N/A
/-rgt-identityN/A
clear-numN/A
lift-/.f64N/A
lift-asin.f64N/A
lift-pow.f64N/A
lift-PI.f64N/A
lift-asin.f64N/A
Applied egg-rr7.8%
if 0.0 < (acos.f64 (-.f64 #s(literal 1 binary64) x)) Initial program 68.5%
Final simplification11.6%
(FPCore (x) :precision binary64 (if (<= x 5.5e-17) (acos (- x)) (acos (- 1.0 x))))
double code(double x) {
double tmp;
if (x <= 5.5e-17) {
tmp = acos(-x);
} else {
tmp = acos((1.0 - x));
}
return tmp;
}
real(8) function code(x)
real(8), intent (in) :: x
real(8) :: tmp
if (x <= 5.5d-17) then
tmp = acos(-x)
else
tmp = acos((1.0d0 - x))
end if
code = tmp
end function
public static double code(double x) {
double tmp;
if (x <= 5.5e-17) {
tmp = Math.acos(-x);
} else {
tmp = Math.acos((1.0 - x));
}
return tmp;
}
def code(x): tmp = 0 if x <= 5.5e-17: tmp = math.acos(-x) else: tmp = math.acos((1.0 - x)) return tmp
function code(x) tmp = 0.0 if (x <= 5.5e-17) tmp = acos(Float64(-x)); else tmp = acos(Float64(1.0 - x)); end return tmp end
function tmp_2 = code(x) tmp = 0.0; if (x <= 5.5e-17) tmp = acos(-x); else tmp = acos((1.0 - x)); end tmp_2 = tmp; end
code[x_] := If[LessEqual[x, 5.5e-17], N[ArcCos[(-x)], $MachinePrecision], N[ArcCos[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \leq 5.5 \cdot 10^{-17}:\\
\;\;\;\;\cos^{-1} \left(-x\right)\\
\mathbf{else}:\\
\;\;\;\;\cos^{-1} \left(1 - x\right)\\
\end{array}
\end{array}
if x < 5.50000000000000001e-17Initial program 3.8%
Taylor expanded in x around inf
mul-1-negN/A
lower-neg.f646.7
Simplified6.7%
if 5.50000000000000001e-17 < x Initial program 68.5%
(FPCore (x) :precision binary64 (acos (- x)))
double code(double x) {
return acos(-x);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(-x)
end function
public static double code(double x) {
return Math.acos(-x);
}
def code(x): return math.acos(-x)
function code(x) return acos(Float64(-x)) end
function tmp = code(x) tmp = acos(-x); end
code[x_] := N[ArcCos[(-x)], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} \left(-x\right)
\end{array}
Initial program 7.9%
Taylor expanded in x around inf
mul-1-negN/A
lower-neg.f647.1
Simplified7.1%
(FPCore (x) :precision binary64 (acos 1.0))
double code(double x) {
return acos(1.0);
}
real(8) function code(x)
real(8), intent (in) :: x
code = acos(1.0d0)
end function
public static double code(double x) {
return Math.acos(1.0);
}
def code(x): return math.acos(1.0)
function code(x) return acos(1.0) end
function tmp = code(x) tmp = acos(1.0); end
code[x_] := N[ArcCos[1.0], $MachinePrecision]
\begin{array}{l}
\\
\cos^{-1} 1
\end{array}
Initial program 7.9%
Taylor expanded in x around 0
Simplified3.8%
(FPCore (x) :precision binary64 (* 2.0 (asin (sqrt (/ x 2.0)))))
double code(double x) {
return 2.0 * asin(sqrt((x / 2.0)));
}
real(8) function code(x)
real(8), intent (in) :: x
code = 2.0d0 * asin(sqrt((x / 2.0d0)))
end function
public static double code(double x) {
return 2.0 * Math.asin(Math.sqrt((x / 2.0)));
}
def code(x): return 2.0 * math.asin(math.sqrt((x / 2.0)))
function code(x) return Float64(2.0 * asin(sqrt(Float64(x / 2.0)))) end
function tmp = code(x) tmp = 2.0 * asin(sqrt((x / 2.0))); end
code[x_] := N[(2.0 * N[ArcSin[N[Sqrt[N[(x / 2.0), $MachinePrecision]], $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
2 \cdot \sin^{-1} \left(\sqrt{\frac{x}{2}}\right)
\end{array}
herbie shell --seed 2024207
(FPCore (x)
:name "bug323 (missed optimization)"
:precision binary64
:pre (and (<= 0.0 x) (<= x 0.5))
:alt
(! :herbie-platform default (* 2 (asin (sqrt (/ x 2)))))
(acos (- 1.0 x)))