
(FPCore (x y) :precision binary64 (+ (+ (+ (* x x) (* y y)) (* y y)) (* y y)))
double code(double x, double y) {
return (((x * x) + (y * y)) + (y * y)) + (y * y);
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
code = (((x * x) + (y * y)) + (y * y)) + (y * y)
end function
public static double code(double x, double y) {
return (((x * x) + (y * y)) + (y * y)) + (y * y);
}
def code(x, y): return (((x * x) + (y * y)) + (y * y)) + (y * y)
function code(x, y) return Float64(Float64(Float64(Float64(x * x) + Float64(y * y)) + Float64(y * y)) + Float64(y * y)) end
function tmp = code(x, y) tmp = (((x * x) + (y * y)) + (y * y)) + (y * y); end
code[x_, y_] := N[(N[(N[(N[(x * x), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(\left(x \cdot x + y \cdot y\right) + y \cdot y\right) + y \cdot y
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 7 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x y) :precision binary64 (+ (+ (+ (* x x) (* y y)) (* y y)) (* y y)))
double code(double x, double y) {
return (((x * x) + (y * y)) + (y * y)) + (y * y);
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
code = (((x * x) + (y * y)) + (y * y)) + (y * y)
end function
public static double code(double x, double y) {
return (((x * x) + (y * y)) + (y * y)) + (y * y);
}
def code(x, y): return (((x * x) + (y * y)) + (y * y)) + (y * y)
function code(x, y) return Float64(Float64(Float64(Float64(x * x) + Float64(y * y)) + Float64(y * y)) + Float64(y * y)) end
function tmp = code(x, y) tmp = (((x * x) + (y * y)) + (y * y)) + (y * y); end
code[x_, y_] := N[(N[(N[(N[(x * x), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(\left(x \cdot x + y \cdot y\right) + y \cdot y\right) + y \cdot y
\end{array}
(FPCore (x y) :precision binary64 (fma (* 2.0 y) y (fma y y (* x x))))
double code(double x, double y) {
return fma((2.0 * y), y, fma(y, y, (x * x)));
}
function code(x, y) return fma(Float64(2.0 * y), y, fma(y, y, Float64(x * x))) end
code[x_, y_] := N[(N[(2.0 * y), $MachinePrecision] * y + N[(y * y + N[(x * x), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(2 \cdot y, y, \mathsf{fma}\left(y, y, x \cdot x\right)\right)
\end{array}
Initial program 99.9%
lift-+.f64N/A
lift-+.f64N/A
associate-+l+N/A
+-commutativeN/A
count-2N/A
lift-*.f64N/A
associate-*r*N/A
count-2N/A
lower-fma.f64N/A
count-2N/A
lower-*.f6499.9
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6499.9
Applied rewrites99.9%
(FPCore (x y) :precision binary64 (if (<= (* x x) 1.65e-18) (fma y (+ y y) (* y y)) (* x x)))
double code(double x, double y) {
double tmp;
if ((x * x) <= 1.65e-18) {
tmp = fma(y, (y + y), (y * y));
} else {
tmp = x * x;
}
return tmp;
}
function code(x, y) tmp = 0.0 if (Float64(x * x) <= 1.65e-18) tmp = fma(y, Float64(y + y), Float64(y * y)); else tmp = Float64(x * x); end return tmp end
code[x_, y_] := If[LessEqual[N[(x * x), $MachinePrecision], 1.65e-18], N[(y * N[(y + y), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision], N[(x * x), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \cdot x \leq 1.65 \cdot 10^{-18}:\\
\;\;\;\;\mathsf{fma}\left(y, y + y, y \cdot y\right)\\
\mathbf{else}:\\
\;\;\;\;x \cdot x\\
\end{array}
\end{array}
if (*.f64 x x) < 1.6500000000000001e-18Initial program 99.7%
Taylor expanded in x around 0
distribute-lft1-inN/A
metadata-evalN/A
lower-*.f64N/A
unpow2N/A
lower-*.f6487.4
Applied rewrites87.4%
Applied rewrites87.6%
if 1.6500000000000001e-18 < (*.f64 x x) Initial program 100.0%
lift-+.f64N/A
+-commutativeN/A
flip-+N/A
div-invN/A
lower-*.f64N/A
lower--.f64N/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
lower-/.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
+-commutativeN/A
lower-*.f64N/A
Applied rewrites21.2%
Taylor expanded in x around inf
associate-+r+N/A
associate-+r+N/A
distribute-lft1-inN/A
metadata-evalN/A
mul0-lftN/A
metadata-evalN/A
*-rgt-identityN/A
unpow2N/A
lower-*.f6481.7
Applied rewrites81.7%
(FPCore (x y) :precision binary64 (if (<= (* x x) 1.65e-18) (* (* 3.0 y) y) (* x x)))
double code(double x, double y) {
double tmp;
if ((x * x) <= 1.65e-18) {
tmp = (3.0 * y) * y;
} else {
tmp = x * x;
}
return tmp;
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8) :: tmp
if ((x * x) <= 1.65d-18) then
tmp = (3.0d0 * y) * y
else
tmp = x * x
end if
code = tmp
end function
public static double code(double x, double y) {
double tmp;
if ((x * x) <= 1.65e-18) {
tmp = (3.0 * y) * y;
} else {
tmp = x * x;
}
return tmp;
}
def code(x, y): tmp = 0 if (x * x) <= 1.65e-18: tmp = (3.0 * y) * y else: tmp = x * x return tmp
function code(x, y) tmp = 0.0 if (Float64(x * x) <= 1.65e-18) tmp = Float64(Float64(3.0 * y) * y); else tmp = Float64(x * x); end return tmp end
function tmp_2 = code(x, y) tmp = 0.0; if ((x * x) <= 1.65e-18) tmp = (3.0 * y) * y; else tmp = x * x; end tmp_2 = tmp; end
code[x_, y_] := If[LessEqual[N[(x * x), $MachinePrecision], 1.65e-18], N[(N[(3.0 * y), $MachinePrecision] * y), $MachinePrecision], N[(x * x), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \cdot x \leq 1.65 \cdot 10^{-18}:\\
\;\;\;\;\left(3 \cdot y\right) \cdot y\\
\mathbf{else}:\\
\;\;\;\;x \cdot x\\
\end{array}
\end{array}
if (*.f64 x x) < 1.6500000000000001e-18Initial program 99.7%
Taylor expanded in x around 0
distribute-lft1-inN/A
metadata-evalN/A
lower-*.f64N/A
unpow2N/A
lower-*.f6487.4
Applied rewrites87.4%
Applied rewrites87.5%
if 1.6500000000000001e-18 < (*.f64 x x) Initial program 100.0%
lift-+.f64N/A
+-commutativeN/A
flip-+N/A
div-invN/A
lower-*.f64N/A
lower--.f64N/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
lower-/.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
+-commutativeN/A
lower-*.f64N/A
Applied rewrites21.2%
Taylor expanded in x around inf
associate-+r+N/A
associate-+r+N/A
distribute-lft1-inN/A
metadata-evalN/A
mul0-lftN/A
metadata-evalN/A
*-rgt-identityN/A
unpow2N/A
lower-*.f6481.7
Applied rewrites81.7%
(FPCore (x y) :precision binary64 (if (<= (* x x) 1.65e-18) (* 3.0 (* y y)) (* x x)))
double code(double x, double y) {
double tmp;
if ((x * x) <= 1.65e-18) {
tmp = 3.0 * (y * y);
} else {
tmp = x * x;
}
return tmp;
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8) :: tmp
if ((x * x) <= 1.65d-18) then
tmp = 3.0d0 * (y * y)
else
tmp = x * x
end if
code = tmp
end function
public static double code(double x, double y) {
double tmp;
if ((x * x) <= 1.65e-18) {
tmp = 3.0 * (y * y);
} else {
tmp = x * x;
}
return tmp;
}
def code(x, y): tmp = 0 if (x * x) <= 1.65e-18: tmp = 3.0 * (y * y) else: tmp = x * x return tmp
function code(x, y) tmp = 0.0 if (Float64(x * x) <= 1.65e-18) tmp = Float64(3.0 * Float64(y * y)); else tmp = Float64(x * x); end return tmp end
function tmp_2 = code(x, y) tmp = 0.0; if ((x * x) <= 1.65e-18) tmp = 3.0 * (y * y); else tmp = x * x; end tmp_2 = tmp; end
code[x_, y_] := If[LessEqual[N[(x * x), $MachinePrecision], 1.65e-18], N[(3.0 * N[(y * y), $MachinePrecision]), $MachinePrecision], N[(x * x), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;x \cdot x \leq 1.65 \cdot 10^{-18}:\\
\;\;\;\;3 \cdot \left(y \cdot y\right)\\
\mathbf{else}:\\
\;\;\;\;x \cdot x\\
\end{array}
\end{array}
if (*.f64 x x) < 1.6500000000000001e-18Initial program 99.7%
Taylor expanded in x around 0
distribute-lft1-inN/A
metadata-evalN/A
lower-*.f64N/A
unpow2N/A
lower-*.f6487.4
Applied rewrites87.4%
if 1.6500000000000001e-18 < (*.f64 x x) Initial program 100.0%
lift-+.f64N/A
+-commutativeN/A
flip-+N/A
div-invN/A
lower-*.f64N/A
lower--.f64N/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
lower-/.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
+-commutativeN/A
lower-*.f64N/A
Applied rewrites21.2%
Taylor expanded in x around inf
associate-+r+N/A
associate-+r+N/A
distribute-lft1-inN/A
metadata-evalN/A
mul0-lftN/A
metadata-evalN/A
*-rgt-identityN/A
unpow2N/A
lower-*.f6481.7
Applied rewrites81.7%
(FPCore (x y) :precision binary64 (fma y (fma 2.0 y y) (* x x)))
double code(double x, double y) {
return fma(y, fma(2.0, y, y), (x * x));
}
function code(x, y) return fma(y, fma(2.0, y, y), Float64(x * x)) end
code[x_, y_] := N[(y * N[(2.0 * y + y), $MachinePrecision] + N[(x * x), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(y, \mathsf{fma}\left(2, y, y\right), x \cdot x\right)
\end{array}
Initial program 99.9%
lift-+.f64N/A
lift-+.f64N/A
lift-+.f64N/A
associate-+l+N/A
associate-+l+N/A
+-commutativeN/A
lift-*.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-*.f64N/A
distribute-lft-outN/A
lower-fma.f64N/A
count-2N/A
lower-fma.f6499.9
Applied rewrites99.9%
(FPCore (x y) :precision binary64 (fma 3.0 (* y y) (* x x)))
double code(double x, double y) {
return fma(3.0, (y * y), (x * x));
}
function code(x, y) return fma(3.0, Float64(y * y), Float64(x * x)) end
code[x_, y_] := N[(3.0 * N[(y * y), $MachinePrecision] + N[(x * x), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\mathsf{fma}\left(3, y \cdot y, x \cdot x\right)
\end{array}
Initial program 99.9%
lift-+.f64N/A
lift-+.f64N/A
lift-+.f64N/A
associate-+l+N/A
associate-+l+N/A
+-commutativeN/A
count-2N/A
distribute-lft1-inN/A
metadata-evalN/A
lower-fma.f6499.9
Applied rewrites99.9%
(FPCore (x y) :precision binary64 (* x x))
double code(double x, double y) {
return x * x;
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
code = x * x
end function
public static double code(double x, double y) {
return x * x;
}
def code(x, y): return x * x
function code(x, y) return Float64(x * x) end
function tmp = code(x, y) tmp = x * x; end
code[x_, y_] := N[(x * x), $MachinePrecision]
\begin{array}{l}
\\
x \cdot x
\end{array}
Initial program 99.9%
lift-+.f64N/A
+-commutativeN/A
flip-+N/A
div-invN/A
lower-*.f64N/A
lower--.f64N/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
pow2N/A
lift-*.f64N/A
pow-prod-downN/A
pow-prod-upN/A
lower-pow.f64N/A
metadata-evalN/A
lower-/.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
+-commutativeN/A
lower-*.f64N/A
Applied rewrites32.7%
Taylor expanded in x around inf
associate-+r+N/A
associate-+r+N/A
distribute-lft1-inN/A
metadata-evalN/A
mul0-lftN/A
metadata-evalN/A
*-rgt-identityN/A
unpow2N/A
lower-*.f6454.2
Applied rewrites54.2%
(FPCore (x y) :precision binary64 (+ (* x x) (* y (+ y (+ y y)))))
double code(double x, double y) {
return (x * x) + (y * (y + (y + y)));
}
real(8) function code(x, y)
real(8), intent (in) :: x
real(8), intent (in) :: y
code = (x * x) + (y * (y + (y + y)))
end function
public static double code(double x, double y) {
return (x * x) + (y * (y + (y + y)));
}
def code(x, y): return (x * x) + (y * (y + (y + y)))
function code(x, y) return Float64(Float64(x * x) + Float64(y * Float64(y + Float64(y + y)))) end
function tmp = code(x, y) tmp = (x * x) + (y * (y + (y + y))); end
code[x_, y_] := N[(N[(x * x), $MachinePrecision] + N[(y * N[(y + N[(y + y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
x \cdot x + y \cdot \left(y + \left(y + y\right)\right)
\end{array}
herbie shell --seed 2024318
(FPCore (x y)
:name "Linear.Quaternion:$c/ from linear-1.19.1.3, E"
:precision binary64
:alt
(! :herbie-platform default (+ (* x x) (* y (+ y (+ y y)))))
(+ (+ (+ (* x x) (* y y)) (* y y)) (* y y)))