
; Original expression, evaluated in binary64:
;   (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1
; The square of (a^2 + b^2) is taken with pow and the exponent 2.0.
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
! Evaluate (a**2 + b**2)**2 + 4*(a**2*(1 + a) + b**2*(1 - 3*a)) - 1.
!   a, b : real(8) inputs
!   code : real(8) result; the squared norm is raised to the real power 2.0d0
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    real(8) :: a_sq, b_sq, quartic, mixed

    a_sq = a * a
    b_sq = b * b
    quartic = (a_sq + b_sq) ** 2.0d0
    ! Cubic-in-a part plus the b**2 part that carries the (1 - 3a) factor.
    mixed = (a_sq * (1.0d0 + a)) + (b_sq * (1.0d0 - (3.0d0 * a)))
    code = (quartic + (4.0d0 * mixed)) - 1.0d0
end function
/**
 * Evaluates (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
 *
 * @param a first input
 * @param b second input
 * @return the value of the expression; the squared norm is squared via
 *         {@code Math.pow(x, 2.0)}
 */
public static double code(double a, double b) {
    final double aSq = a * a;
    final double bSq = b * b;
    final double quartic = Math.pow(aSq + bSq, 2.0);
    final double mixed = (aSq * (1.0 + a)) + (bSq * (1.0 - (3.0 * a)));
    return (quartic + (4.0 * mixed)) - 1.0;
}
def code(a, b):
    """Evaluate (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.

    Args:
        a: first input (float).
        b: second input (float).

    Returns:
        The value of the expression as a float. When squaring (a^2 + b^2)
        overflows, the squared term is taken as +inf instead of letting
        ``math.pow`` raise ``OverflowError``, which matches the IEEE-754
        result of the C ``pow`` call this expression mirrors.
    """
    norm_sq = (a * a) + (b * b)
    try:
        quartic = math.pow(norm_sq, 2.0)
    except OverflowError:
        # math.pow raises on a finite-input overflow; for float inputs
        # norm_sq is non-negative, so the overflowed square is +inf.
        quartic = float("inf")
    return (quartic + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
# Evaluate (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
# Every intermediate is passed through Float64(...) exactly as in the
# one-line form, so each operation result is a Float64.
function code(a, b)
    a_sq = Float64(a * a)
    b_sq = Float64(b * b)
    quartic = Float64(a_sq + b_sq) ^ 2.0
    a_part = Float64(a_sq * Float64(1.0 + a))
    b_part = Float64(b_sq * Float64(1.0 - Float64(3.0 * a)))
    scaled = Float64(4.0 * Float64(a_part + b_part))
    return Float64(Float64(quartic + scaled) - 1.0)
end
function tmp = code(a, b)
    % CODE  Evaluate (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
    %   tmp = code(a, b) returns the value of the expression.
    %   NOTE(review): uses the * and ^ operators, so this is presumably
    %   meant for scalar a and b - confirm against callers.
    a_sq = a * a;
    b_sq = b * b;
    quartic = (a_sq + b_sq) ^ 2.0;
    mixed = (a_sq * (1.0 + a)) + (b_sq * (1.0 - (3.0 * a)));
    tmp = (quartic + (4.0 * mixed)) - 1.0;
end
(* code[a, b]: evaluates (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1. *)
(* Each intermediate result is wrapped in N[..., $MachinePrecision]; the square is taken with Power[..., 2.0]. *)
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Unmodified input expression in binary64:
;   (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
! Returns (a**2 + b**2)**2 + 4*(a**2*(1 + a) + b**2*(1 - 3*a)) - 1
! for real(8) inputs a and b.
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    real(8) :: sum_sq, a_term, b_term

    sum_sq = (a * a) + (b * b)
    a_term = (a * a) * (1.0d0 + a)
    b_term = (b * b) * (1.0d0 - (3.0d0 * a))
    ! Square of the squared norm uses the real exponent 2.0d0.
    code = ((sum_sq ** 2.0d0) + (4.0d0 * (a_term + b_term))) - 1.0d0
end function
/**
 * Computes (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
 *
 * @param a first input
 * @param b second input
 * @return the expression value, with the square taken by {@code Math.pow}
 */
public static double code(double a, double b) {
    double sumSq = (a * a) + (b * b);
    double aTerm = (a * a) * (1.0 + a);
    double bTerm = (b * b) * (1.0 - (3.0 * a));
    double result = Math.pow(sumSq, 2.0);
    result = result + (4.0 * (aTerm + bTerm));
    return result - 1.0;
}
def code(a, b):
    """Return (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.

    Args:
        a: first input (float).
        b: second input (float).

    Returns:
        The expression value as a float. ``math.pow`` raises
        ``OverflowError`` when the square of (a^2 + b^2) exceeds the float
        range; that case is mapped to +inf so large inputs produce an
        infinite result instead of an exception.
    """
    sum_sq = (a * a) + (b * b)
    try:
        squared = math.pow(sum_sq, 2.0)
    except OverflowError:
        # For float inputs sum_sq is non-negative, so the overflow is +inf.
        squared = float("inf")
    return (squared + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
# Returns (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
# The Float64(...) wrappers around each operation are kept as in the
# single-line form.
function code(a, b)
    sum_sq = Float64(Float64(a * a) + Float64(b * b))
    a_term = Float64(Float64(a * a) * Float64(1.0 + a))
    b_term = Float64(Float64(b * b) * Float64(1.0 - Float64(3.0 * a)))
    total = Float64((sum_sq ^ 2.0) + Float64(4.0 * Float64(a_term + b_term)))
    return Float64(total - 1.0)
end
function tmp = code(a, b)
    % CODE  Returns (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1.
    %   NOTE(review): written with * and ^, so scalar inputs are presumably
    %   expected - confirm against callers.
    sum_sq = (a * a) + (b * b);
    a_term = (a * a) * (1.0 + a);
    b_term = (b * b) * (1.0 - (3.0 * a));
    tmp = ((sum_sq ^ 2.0) + (4.0 * (a_term + b_term))) - 1.0;
end
(* code[a, b]: the unmodified expression (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1. *)
(* Every intermediate is rounded with N[..., $MachinePrecision]. *)
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}
; Alternative form: with t_0 = fma(a, a, b*b), computes
;   t_0 / (1 / t_0) + 4*b^2 - 1
; The square of t_0 is written as a division by its reciprocal. Compared with
; the original expression, the 4*a^2*(1 + a) and -12*a*b^2 terms do not appear.
(FPCore (a b) :precision binary64 (let* ((t_0 (fma a a (* b b)))) (+ (+ (/ t_0 (/ 1.0 t_0)) (* 4.0 (* b b))) -1.0)))
double code(double a, double b) {
double t_0 = fma(a, a, (b * b));
return ((t_0 / (1.0 / t_0)) + (4.0 * (b * b))) + -1.0;
}
# Alternative form of the expression: with t_0 = fma(a, a, b*b), returns
# t_0 / (1 / t_0) + 4*b^2 - 1, rounding each step through Float64(...).
# The statements are placed on separate lines; run together on one line
# without separators they do not parse as Julia.
function code(a, b)
    t_0 = fma(a, a, Float64(b * b))
    return Float64(Float64(Float64(t_0 / Float64(1.0 / t_0)) + Float64(4.0 * Float64(b * b))) + -1.0)
end
(* code[a, b]: alternative form t0/(1/t0) + 4*b^2 - 1, where the Block-local t$95$0 holds a*a + b*b. *)
(* Each intermediate is rounded with N[..., $MachinePrecision]; a*a + N[b*b] is rounded once as a whole. *)
code[a_, b_] := Block[{t$95$0 = N[(a * a + N[(b * b), $MachinePrecision]), $MachinePrecision]}, N[(N[(N[(t$95$0 / N[(1.0 / t$95$0), $MachinePrecision]), $MachinePrecision] + N[(4.0 * N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \mathsf{fma}\left(a, a, b \cdot b\right)\\
\left(\frac{t_0}{\frac{1}{t_0}} + 4 \cdot \left(b \cdot b\right)\right) + -1
\end{array}
\end{array}
Initial program 74.1%
lift-pow.f64 N/A
unpow2 N/A
lift-+.f64 N/A
flip-+ N/A
clear-num N/A
un-div-inv N/A
lower-/.f64 N/A
lift-+.f64 N/A
lift-*.f64 N/A
lower-fma.f64 N/A
clear-num N/A
flip-+ N/A
lift-+.f64 N/A
lower-/.f64 74.1
lift-+.f64 N/A
lift-*.f64 N/A
lower-fma.f64 74.1
Applied rewrites 74.1%
Taylor expanded in a around 0
unpow2 N/A
lower-*.f64 99.5
Applied rewrites 99.5%
Final simplification 99.5%
; Regime-split alternative, branching on b*b:
;   b*b <= 5       : (a^2 + 4*a + 4)*a^2 - 1            (no b terms)
;   b*b <= 5e+302  : b^4 + 4*b^2 + a*(b^2*(2*a - 12) + 4*a) - 1
;   otherwise      : 4*b^2 - 1
(FPCore (a b)
:precision binary64
(if (<= (* b b) 5.0)
(fma (fma a (+ a 4.0) 4.0) (* a a) -1.0)
(if (<= (* b b) 5e+302)
(fma
b
(* b (fma b b 4.0))
(fma a (fma (* b b) (fma 2.0 a -12.0) (* a 4.0)) -1.0))
(fma (* b b) 4.0 -1.0))))
double code(double a, double b) {
double tmp;
if ((b * b) <= 5.0) {
tmp = fma(fma(a, (a + 4.0), 4.0), (a * a), -1.0);
} else if ((b * b) <= 5e+302) {
tmp = fma(b, (b * fma(b, b, 4.0)), fma(a, fma((b * b), fma(2.0, a, -12.0), (a * 4.0)), -1.0));
} else {
tmp = fma((b * b), 4.0, -1.0);
}
return tmp;
}
# Regime-split alternative of the expression, selected by Float64(b * b):
#   <= 5.0     -> (a^2 + 4a + 4) * a^2 - 1
#   <= 5e+302  -> b^4 + 4b^2 + a*(b^2*(2a - 12) + 4a) - 1
#   otherwise  -> 4*b^2 - 1
# The statements are placed on separate lines; run together on one line
# without separators (`tmp = 0.0 if ...`) they do not parse as Julia.
function code(a, b)
    tmp = 0.0
    if (Float64(b * b) <= 5.0)
        tmp = fma(fma(a, Float64(a + 4.0), 4.0), Float64(a * a), -1.0);
    elseif (Float64(b * b) <= 5e+302)
        tmp = fma(b, Float64(b * fma(b, b, 4.0)), fma(a, fma(Float64(b * b), fma(2.0, a, -12.0), Float64(a * 4.0)), -1.0));
    else
        tmp = fma(Float64(b * b), 4.0, -1.0);
    end
    return tmp
end
(* code[a, b]: regime-split alternative, branching on b*b. *)
(*   b*b <= 5.0     : (a*(a + 4) + 4)*(a*a) - 1 *)
(*   b*b <= 5e+302  : b*(b*(b*b + 4)) + (a*((b*b)*(2*a - 12) + a*4) - 1) *)
(*   otherwise      : (b*b)*4 - 1 *)
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 5.0], N[(N[(a * N[(a + 4.0), $MachinePrecision] + 4.0), $MachinePrecision] * N[(a * a), $MachinePrecision] + -1.0), $MachinePrecision], If[LessEqual[N[(b * b), $MachinePrecision], 5e+302], N[(b * N[(b * N[(b * b + 4.0), $MachinePrecision]), $MachinePrecision] + N[(a * N[(N[(b * b), $MachinePrecision] * N[(2.0 * a + -12.0), $MachinePrecision] + N[(a * 4.0), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision], N[(N[(b * b), $MachinePrecision] * 4.0 + -1.0), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 5:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(a, a + 4, 4\right), a \cdot a, -1\right)\\
\mathbf{elif}\;b \cdot b \leq 5 \cdot 10^{+302}:\\
\;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \mathsf{fma}\left(a, \mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(2, a, -12\right), a \cdot 4\right), -1\right)\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\
\end{array}
\end{array}
if (*.f64 b b) < 5
Initial program 83.7%
Taylor expanded in b around 0
sub-neg N/A
+-commutative N/A
metadata-eval N/A
pow-sqr N/A
*-commutative N/A
associate-*r* N/A
distribute-rgt-out N/A
metadata-eval N/A
lower-fma.f64 N/A
unpow2 N/A
lower-*.f64 N/A
unpow2 N/A
lower-fma.f64 N/A
+-commutative N/A
distribute-lft-in N/A
metadata-eval N/A
lower-fma.f64 99.3
Applied rewrites 99.3%
Applied rewrites 99.4%
if 5 < (*.f64 b b) < 5e302
Initial program 70.9%
Taylor expanded in a around 0
+-commutative N/A
associate-+r+ N/A
associate--l+ N/A
+-commutative N/A
metadata-eval N/A
pow-plus N/A
cube-unmult N/A
unpow2 N/A
unpow2 N/A
associate-*r* N/A
distribute-rgt-out N/A
lower-fma.f64 N/A
Applied rewrites 93.7%
if 5e302 < (*.f64 b b)
Initial program 60.0%
Taylor expanded in a around 0
sub-neg N/A
+-commutative N/A
metadata-eval N/A
pow-sqr N/A
distribute-rgt-out N/A
metadata-eval N/A
lower-fma.f64 N/A
unpow2 N/A
lower-*.f64 N/A
unpow2 N/A
lower-fma.f64 100.0
Applied rewrites 100.0%
Taylor expanded in b around 0
Applied rewrites 98.6%
Final simplification 97.8%
herbie shell --seed 2024229
; Named benchmark expression in binary64:
;   (a^2 + b^2)^2 + 4*(a^2*(1 + a) + b^2*(1 - 3*a)) - 1
(FPCore (a b)
:name "Bouland and Aaronson, Equation (25)"
:precision binary64
(- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))