
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (- 1.0 a)) (* (* b b) (+ 3.0 a))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0;
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 - a)) + ((b * b) * (3.0d0 + a))))) - 1.0d0
end function
public static double code(double a, double b) {
return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0;
}
def code(a, b): return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0
function code(a, b) return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(Float64(Float64(a * a) * Float64(1.0 - a)) + Float64(Float64(b * b) * Float64(3.0 + a))))) - 1.0) end
function tmp = code(a, b) tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0; end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 - a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(3.0 + a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 - a\right) + \left(b \cdot b\right) \cdot \left(3 + a\right)\right)\right) - 1
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a b) :precision binary64 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (- 1.0 a)) (* (* b b) (+ 3.0 a))))) 1.0))
double code(double a, double b) {
return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0;
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 - a)) + ((b * b) * (3.0d0 + a))))) - 1.0d0
end function
public static double code(double a, double b) {
return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0;
}
def code(a, b): return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0
function code(a, b) return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(Float64(Float64(a * a) * Float64(1.0 - a)) + Float64(Float64(b * b) * Float64(3.0 + a))))) - 1.0) end
function tmp = code(a, b) tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (((a * a) * (1.0 - a)) + ((b * b) * (3.0 + a))))) - 1.0; end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 - a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(3.0 + a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 - a\right) + \left(b \cdot b\right) \cdot \left(3 + a\right)\right)\right) - 1
\end{array}
(FPCore (a b) :precision binary64 (fma (* (fma (fma 2.0 a 4.0) a (fma b b 12.0)) b) b (fma (* a a) (fma 4.0 (- 1.0 a) (* a a)) -1.0)))
double code(double a, double b) {
return fma((fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, fma((a * a), fma(4.0, (1.0 - a), (a * a)), -1.0));
}
function code(a, b) return fma(Float64(fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, fma(Float64(a * a), fma(4.0, Float64(1.0 - a), Float64(a * a)), -1.0)) end
code[a_, b_] := N[(N[(N[(N[(2.0 * a + 4.0), $MachinePrecision] * a + N[(b * b + 12.0), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * b + N[(N[(a * a), $MachinePrecision] * N[(4.0 * N[(1.0 - a), $MachinePrecision] + N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(2, a, 4\right), a, \mathsf{fma}\left(b, b, 12\right)\right) \cdot b, b, \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(4, 1 - a, a \cdot a\right), -1\right)\right)
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.0
Applied rewrites99.0%
Taylor expanded in b around 0
Applied rewrites99.9%
(FPCore (a b) :precision binary64 (fma (* (fma (fma 2.0 a 4.0) a (fma b b 12.0)) b) b (fma (* a a) (* a a) -1.0)))
double code(double a, double b) {
return fma((fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, fma((a * a), (a * a), -1.0));
}
function code(a, b) return fma(Float64(fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, fma(Float64(a * a), Float64(a * a), -1.0)) end
code[a_, b_] := N[(N[(N[(N[(2.0 * a + 4.0), $MachinePrecision] * a + N[(b * b + 12.0), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * b + N[(N[(a * a), $MachinePrecision] * N[(a * a), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(2, a, 4\right), a, \mathsf{fma}\left(b, b, 12\right)\right) \cdot b, b, \mathsf{fma}\left(a \cdot a, a \cdot a, -1\right)\right)
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.0
Applied rewrites99.0%
Taylor expanded in b around 0
Applied rewrites99.9%
Taylor expanded in a around inf
Applied rewrites99.1%
(FPCore (a b) :precision binary64 (fma (* (fma b b 12.0) b) b (fma (* a a) (fma 4.0 (- 1.0 a) (* a a)) -1.0)))
double code(double a, double b) {
return fma((fma(b, b, 12.0) * b), b, fma((a * a), fma(4.0, (1.0 - a), (a * a)), -1.0));
}
function code(a, b) return fma(Float64(fma(b, b, 12.0) * b), b, fma(Float64(a * a), fma(4.0, Float64(1.0 - a), Float64(a * a)), -1.0)) end
code[a_, b_] := N[(N[(N[(b * b + 12.0), $MachinePrecision] * b), $MachinePrecision] * b + N[(N[(a * a), $MachinePrecision] * N[(4.0 * N[(1.0 - a), $MachinePrecision] + N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\mathsf{fma}\left(b, b, 12\right) \cdot b, b, \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(4, 1 - a, a \cdot a\right), -1\right)\right)
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.0
Applied rewrites99.0%
Taylor expanded in b around 0
Applied rewrites99.9%
Taylor expanded in a around 0
Applied rewrites99.0%
(FPCore (a b) :precision binary64 (if (<= (* b b) 2e-31) (fma (* a a) (fma 4.0 (- 1.0 a) (* a a)) -1.0) (fma (* (fma (fma 2.0 a 4.0) a (fma b b 12.0)) b) b -1.0)))
double code(double a, double b) {
double tmp;
if ((b * b) <= 2e-31) {
tmp = fma((a * a), fma(4.0, (1.0 - a), (a * a)), -1.0);
} else {
tmp = fma((fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, -1.0);
}
return tmp;
}
function code(a, b) tmp = 0.0 if (Float64(b * b) <= 2e-31) tmp = fma(Float64(a * a), fma(4.0, Float64(1.0 - a), Float64(a * a)), -1.0); else tmp = fma(Float64(fma(fma(2.0, a, 4.0), a, fma(b, b, 12.0)) * b), b, -1.0); end return tmp end
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 2e-31], N[(N[(a * a), $MachinePrecision] * N[(4.0 * N[(1.0 - a), $MachinePrecision] + N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(N[(N[(N[(2.0 * a + 4.0), $MachinePrecision] * a + N[(b * b + 12.0), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * b + -1.0), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 2 \cdot 10^{-31}:\\
\;\;\;\;\mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(4, 1 - a, a \cdot a\right), -1\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(2, a, 4\right), a, \mathsf{fma}\left(b, b, 12\right)\right) \cdot b, b, -1\right)\\
\end{array}
\end{array}
if (*.f64 b b) < 2e-31Initial program 80.9%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6498.1
Applied rewrites98.1%
Taylor expanded in b around 0
sub-negN/A
*-commutativeN/A
associate-*r*N/A
metadata-evalN/A
pow-sqrN/A
distribute-rgt-outN/A
metadata-evalN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-fma.f64N/A
lower--.f64N/A
unpow2N/A
lower-*.f6499.9
Applied rewrites99.9%
if 2e-31 < (*.f64 b b) Initial program 74.8%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.8
Applied rewrites99.8%
Taylor expanded in b around 0
Applied rewrites99.9%
Taylor expanded in a around 0
Applied rewrites95.1%
(FPCore (a b) :precision binary64 (if (<= (* b b) 5.0) (fma (* a a) (fma 4.0 (- 1.0 a) (* a a)) -1.0) (fma (* (fma b b 12.0) b) b -1.0)))
double code(double a, double b) {
double tmp;
if ((b * b) <= 5.0) {
tmp = fma((a * a), fma(4.0, (1.0 - a), (a * a)), -1.0);
} else {
tmp = fma((fma(b, b, 12.0) * b), b, -1.0);
}
return tmp;
}
function code(a, b) tmp = 0.0 if (Float64(b * b) <= 5.0) tmp = fma(Float64(a * a), fma(4.0, Float64(1.0 - a), Float64(a * a)), -1.0); else tmp = fma(Float64(fma(b, b, 12.0) * b), b, -1.0); end return tmp end
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 5.0], N[(N[(a * a), $MachinePrecision] * N[(4.0 * N[(1.0 - a), $MachinePrecision] + N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(N[(N[(b * b + 12.0), $MachinePrecision] * b), $MachinePrecision] * b + -1.0), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 5:\\
\;\;\;\;\mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(4, 1 - a, a \cdot a\right), -1\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(b, b, 12\right) \cdot b, b, -1\right)\\
\end{array}
\end{array}
if (*.f64 b b) < 5Initial program 80.1%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6498.2
Applied rewrites98.2%
Taylor expanded in b around 0
sub-negN/A
*-commutativeN/A
associate-*r*N/A
metadata-evalN/A
pow-sqrN/A
distribute-rgt-outN/A
metadata-evalN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-fma.f64N/A
lower--.f64N/A
unpow2N/A
lower-*.f6499.3
Applied rewrites99.3%
if 5 < (*.f64 b b) Initial program 75.3%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.8
Applied rewrites99.8%
Taylor expanded in a around 0
sub-negN/A
metadata-evalN/A
pow-sqrN/A
distribute-rgt-inN/A
*-commutativeN/A
unpow2N/A
associate-*r*N/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f64N/A
*-commutativeN/A
lower-*.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f6492.2
Applied rewrites92.2%
(FPCore (a b) :precision binary64 (fma (* (* b b) b) b (fma (* a a) (* a a) -1.0)))
double code(double a, double b) {
return fma(((b * b) * b), b, fma((a * a), (a * a), -1.0));
}
function code(a, b) return fma(Float64(Float64(b * b) * b), b, fma(Float64(a * a), Float64(a * a), -1.0)) end
code[a_, b_] := N[(N[(N[(b * b), $MachinePrecision] * b), $MachinePrecision] * b + N[(N[(a * a), $MachinePrecision] * N[(a * a), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\left(b \cdot b\right) \cdot b, b, \mathsf{fma}\left(a \cdot a, a \cdot a, -1\right)\right)
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.0
Applied rewrites99.0%
Taylor expanded in b around 0
Applied rewrites99.9%
Taylor expanded in a around inf
Applied rewrites99.1%
Taylor expanded in b around inf
Applied rewrites97.7%
(FPCore (a b) :precision binary64 (fma (* (fma b b 12.0) b) b -1.0))
double code(double a, double b) {
return fma((fma(b, b, 12.0) * b), b, -1.0);
}
function code(a, b) return fma(Float64(fma(b, b, 12.0) * b), b, -1.0) end
code[a_, b_] := N[(N[(N[(b * b + 12.0), $MachinePrecision] * b), $MachinePrecision] * b + -1.0), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(\mathsf{fma}\left(b, b, 12\right) \cdot b, b, -1\right)
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
lower-*.f64N/A
unpow2N/A
lower-*.f6499.0
Applied rewrites99.0%
Taylor expanded in a around 0
sub-negN/A
metadata-evalN/A
pow-sqrN/A
distribute-rgt-inN/A
*-commutativeN/A
unpow2N/A
associate-*r*N/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f64N/A
*-commutativeN/A
lower-*.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f6471.9
Applied rewrites71.9%
(FPCore (a b) :precision binary64 (- (* (* 12.0 b) b) 1.0))
double code(double a, double b) {
return ((12.0 * b) * b) - 1.0;
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = ((12.0d0 * b) * b) - 1.0d0
end function
public static double code(double a, double b) {
return ((12.0 * b) * b) - 1.0;
}
def code(a, b): return ((12.0 * b) * b) - 1.0
function code(a, b) return Float64(Float64(Float64(12.0 * b) * b) - 1.0) end
function tmp = code(a, b) tmp = ((12.0 * b) * b) - 1.0; end
code[a_, b_] := N[(N[(N[(12.0 * b), $MachinePrecision] * b), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}
\\
\left(12 \cdot b\right) \cdot b - 1
\end{array}
Initial program 77.6%
Taylor expanded in a around 0
*-commutativeN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-pow.f6471.9
Applied rewrites71.9%
Taylor expanded in b around 0
Applied rewrites51.9%
Applied rewrites51.9%
herbie shell --seed 2024306
(FPCore (a b)
:name "Bouland and Aaronson, Equation (24)"
:precision binary64
(- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (- 1.0 a)) (* (* b b) (+ 3.0 a))))) 1.0))