
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 + a)) + ((b * b) * (1.0d0 - (3.0d0 * a)))))) - 1.0d0
end function
public static double code(double a, double b) {
return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
def code(a, b): return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
function code(a, b) return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(Float64(Float64(a * a) * Float64(1.0 + a)) + Float64(Float64(b * b) * Float64(1.0 - Float64(3.0 * a)))))) - 1.0) end
function tmp = code(a, b) tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0; end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 + a)) + ((b * b) * (1.0d0 - (3.0d0 * a)))))) - 1.0d0
end function
public static double code(double a, double b) {
return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
def code(a, b): return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
function code(a, b) return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(Float64(Float64(a * a) * Float64(1.0 + a)) + Float64(Float64(b * b) * Float64(1.0 - Float64(3.0 * a)))))) - 1.0) end
function tmp = code(a, b) tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0; end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}
(FPCore (a b) :precision binary64 (fma (* (fma (* 2.0 a) a (fma (fma -3.0 a 1.0) 4.0 (* b b))) b) b (fma (* a a) (fma a a (fma a 4.0 4.0)) -1.0)))
double code(double a, double b) {
return fma((fma((2.0 * a), a, fma(fma(-3.0, a, 1.0), 4.0, (b * b))) * b), b, fma((a * a), fma(a, a, fma(a, 4.0, 4.0)), -1.0));
}
function code(a, b) return fma(Float64(fma(Float64(2.0 * a), a, fma(fma(-3.0, a, 1.0), 4.0, Float64(b * b))) * b), b, fma(Float64(a * a), fma(a, a, fma(a, 4.0, 4.0)), -1.0)) end
code[a_, b_] := N[(N[(N[(N[(2.0 * a), $MachinePrecision] * a + N[(N[(-3.0 * a + 1.0), $MachinePrecision] * 4.0 + N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * b + N[(N[(a * a), $MachinePrecision] * N[(a * a + N[(a * 4.0 + 4.0), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\mathsf{fma}\left(2 \cdot a, a, \mathsf{fma}\left(\mathsf{fma}\left(-3, a, 1\right), 4, b \cdot b\right)\right) \cdot b, b, \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, \mathsf{fma}\left(a, 4, 4\right)\right), -1\right)\right)
\end{array}
Initial program 74.9%
Taylor expanded in b around 0
Applied rewrites99.5%
Final simplification99.5%
(FPCore (a b) :precision binary64 (if (<= (* b b) 5e-7) (fma (* (fma a (+ 4.0 a) 4.0) a) a -1.0) (fma (* (fma (* 2.0 a) a (fma (fma (/ b a) b -12.0) a 4.0)) b) b -1.0)))
double code(double a, double b) {
double tmp;
if ((b * b) <= 5e-7) {
tmp = fma((fma(a, (4.0 + a), 4.0) * a), a, -1.0);
} else {
tmp = fma((fma((2.0 * a), a, fma(fma((b / a), b, -12.0), a, 4.0)) * b), b, -1.0);
}
return tmp;
}
function code(a, b) tmp = 0.0 if (Float64(b * b) <= 5e-7) tmp = fma(Float64(fma(a, Float64(4.0 + a), 4.0) * a), a, -1.0); else tmp = fma(Float64(fma(Float64(2.0 * a), a, fma(fma(Float64(b / a), b, -12.0), a, 4.0)) * b), b, -1.0); end return tmp end
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 5e-7], N[(N[(N[(a * N[(4.0 + a), $MachinePrecision] + 4.0), $MachinePrecision] * a), $MachinePrecision] * a + -1.0), $MachinePrecision], N[(N[(N[(N[(2.0 * a), $MachinePrecision] * a + N[(N[(N[(b / a), $MachinePrecision] * b + -12.0), $MachinePrecision] * a + 4.0), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * b + -1.0), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 5 \cdot 10^{-7}:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(a, 4 + a, 4\right) \cdot a, a, -1\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(2 \cdot a, a, \mathsf{fma}\left(\mathsf{fma}\left(\frac{b}{a}, b, -12\right), a, 4\right)\right) \cdot b, b, -1\right)\\
\end{array}
\end{array}
if (*.f64 b b) < 4.99999999999999977e-7Initial program 83.6%
Taylor expanded in b around 0
sub-negN/A
+-commutativeN/A
metadata-evalN/A
pow-sqrN/A
*-commutativeN/A
associate-*r*N/A
distribute-rgt-outN/A
metadata-evalN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
unpow2N/A
lower-fma.f64N/A
+-commutativeN/A
distribute-rgt-inN/A
metadata-evalN/A
lower-fma.f6499.6
Applied rewrites99.6%
Applied rewrites99.7%
if 4.99999999999999977e-7 < (*.f64 b b) Initial program 65.3%
Taylor expanded in b around 0
Applied rewrites99.8%
Taylor expanded in a around inf
Applied rewrites96.9%
Taylor expanded in a around 0
Applied rewrites93.7%
Taylor expanded in a around 0
Applied rewrites93.7%
Final simplification96.6%
herbie shell --seed 2024234
(FPCore (a b)
:name "Bouland and Aaronson, Equation (25)"
:precision binary64
(- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))