
(FPCore (x y z) :precision binary64 (sqrt (+ (* x x) (+ (* y y) (* z z)))))
double code(double x, double y, double z) {
return sqrt(((x * x) + ((y * y) + (z * z))));
}
real(8) function code(x, y, z)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
code = sqrt(((x * x) + ((y * y) + (z * z))))
end function
public static double code(double x, double y, double z) {
return Math.sqrt(((x * x) + ((y * y) + (z * z))));
}
def code(x, y, z): return math.sqrt(((x * x) + ((y * y) + (z * z))))
function code(x, y, z) return sqrt(Float64(Float64(x * x) + Float64(Float64(y * y) + Float64(z * z)))) end
function tmp = code(x, y, z) tmp = sqrt(((x * x) + ((y * y) + (z * z)))); end
code[x_, y_, z_] := N[Sqrt[N[(N[(x * x), $MachinePrecision] + N[(N[(y * y), $MachinePrecision] + N[(z * z), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{x \cdot x + \left(y \cdot y + z \cdot z\right)}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 3 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x y z) :precision binary64 (sqrt (+ (* x x) (+ (* y y) (* z z)))))
double code(double x, double y, double z) {
return sqrt(((x * x) + ((y * y) + (z * z))));
}
real(8) function code(x, y, z)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
code = sqrt(((x * x) + ((y * y) + (z * z))))
end function
public static double code(double x, double y, double z) {
return Math.sqrt(((x * x) + ((y * y) + (z * z))));
}
def code(x, y, z): return math.sqrt(((x * x) + ((y * y) + (z * z))))
function code(x, y, z) return sqrt(Float64(Float64(x * x) + Float64(Float64(y * y) + Float64(z * z)))) end
function tmp = code(x, y, z) tmp = sqrt(((x * x) + ((y * y) + (z * z)))); end
code[x_, y_, z_] := N[Sqrt[N[(N[(x * x), $MachinePrecision] + N[(N[(y * y), $MachinePrecision] + N[(z * z), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{x \cdot x + \left(y \cdot y + z \cdot z\right)}
\end{array}
z_m = (fabs.f64 z) y_m = (fabs.f64 y) x_m = (fabs.f64 x) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (hypot z_m y_m))
z_m = fabs(z);
y_m = fabs(y);
x_m = fabs(x);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return hypot(z_m, y_m);
}
z_m = Math.abs(z);
y_m = Math.abs(y);
x_m = Math.abs(x);
assert x_m < y_m && y_m < z_m;
public static double code(double x_m, double y_m, double z_m) {
return Math.hypot(z_m, y_m);
}
z_m = math.fabs(z) y_m = math.fabs(y) x_m = math.fabs(x) [x_m, y_m, z_m] = sort([x_m, y_m, z_m]) def code(x_m, y_m, z_m): return math.hypot(z_m, y_m)
z_m = abs(z) y_m = abs(y) x_m = abs(x) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return hypot(z_m, y_m) end
z_m = abs(z);
y_m = abs(y);
x_m = abs(x);
x_m, y_m, z_m = num2cell(sort([x_m, y_m, z_m])){:}
function tmp = code(x_m, y_m, z_m)
tmp = hypot(z_m, y_m);
end
z_m = N[Abs[z], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] x_m = N[Abs[x], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := N[Sqrt[z$95$m ^ 2 + y$95$m ^ 2], $MachinePrecision]
\begin{array}{l}
z_m = \left|z\right|
\\
y_m = \left|y\right|
\\
x_m = \left|x\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\mathsf{hypot}\left(z\_m, y\_m\right)
\end{array}
Initial program 48.2%
Taylor expanded in x around 0
+-commutativeN/A
unpow2N/A
lower-fma.f64N/A
unpow2N/A
lower-*.f6433.4
Applied rewrites33.4%
lower-hypot.f6468.7
Applied rewrites68.7%
z_m = (fabs.f64 z) y_m = (fabs.f64 y) x_m = (fabs.f64 x) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (fma (/ (* y_m 0.5) z_m) y_m z_m))
z_m = fabs(z);
y_m = fabs(y);
x_m = fabs(x);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return fma(((y_m * 0.5) / z_m), y_m, z_m);
}
z_m = abs(z) y_m = abs(y) x_m = abs(x) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return fma(Float64(Float64(y_m * 0.5) / z_m), y_m, z_m) end
z_m = N[Abs[z], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] x_m = N[Abs[x], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := N[(N[(N[(y$95$m * 0.5), $MachinePrecision] / z$95$m), $MachinePrecision] * y$95$m + z$95$m), $MachinePrecision]
\begin{array}{l}
z_m = \left|z\right|
\\
y_m = \left|y\right|
\\
x_m = \left|x\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\mathsf{fma}\left(\frac{y\_m \cdot 0.5}{z\_m}, y\_m, z\_m\right)
\end{array}
Initial program 48.2%
Taylor expanded in z around inf
distribute-rgt-inN/A
*-lft-identityN/A
+-commutativeN/A
associate-*l*N/A
*-commutativeN/A
associate-*r/N/A
unpow2N/A
times-fracN/A
*-inversesN/A
associate-/l*N/A
*-lft-identityN/A
lower-fma.f64N/A
Applied rewrites18.5%
Taylor expanded in x around 0
+-commutativeN/A
lower-fma.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f6419.9
Applied rewrites19.9%
lift-*.f64N/A
lift-/.f64N/A
lift-/.f64N/A
lift-*.f64N/A
associate-/l*N/A
*-commutativeN/A
associate-*r*N/A
*-commutativeN/A
lower-fma.f64N/A
associate-*l/N/A
*-commutativeN/A
lower-/.f64N/A
*-commutativeN/A
lower-*.f6421.5
Applied rewrites21.5%
z_m = (fabs.f64 z) y_m = (fabs.f64 y) x_m = (fabs.f64 x) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 z_m)
z_m = fabs(z);
y_m = fabs(y);
x_m = fabs(x);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return z_m;
}
z_m = abs(z)
y_m = abs(y)
x_m = abs(x)
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
real(8) function code(x_m, y_m, z_m)
real(8), intent (in) :: x_m
real(8), intent (in) :: y_m
real(8), intent (in) :: z_m
code = z_m
end function
z_m = Math.abs(z);
y_m = Math.abs(y);
x_m = Math.abs(x);
assert x_m < y_m && y_m < z_m;
public static double code(double x_m, double y_m, double z_m) {
return z_m;
}
z_m = math.fabs(z) y_m = math.fabs(y) x_m = math.fabs(x) [x_m, y_m, z_m] = sort([x_m, y_m, z_m]) def code(x_m, y_m, z_m): return z_m
z_m = abs(z) y_m = abs(y) x_m = abs(x) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return z_m end
z_m = abs(z);
y_m = abs(y);
x_m = abs(x);
x_m, y_m, z_m = num2cell(sort([x_m, y_m, z_m])){:}
function tmp = code(x_m, y_m, z_m)
tmp = z_m;
end
z_m = N[Abs[z], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] x_m = N[Abs[x], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := z$95$m
\begin{array}{l}
z_m = \left|z\right|
\\
y_m = \left|y\right|
\\
x_m = \left|x\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
z\_m
\end{array}
Initial program 48.2%
Taylor expanded in z around inf
unpow2N/A
lower-*.f6419.3
Applied rewrites19.3%
sqrt-prodN/A
rem-square-sqrt20.7
Applied rewrites20.7%
(FPCore (x y z) :precision binary64 (hypot x (hypot y z)))
double code(double x, double y, double z) {
return hypot(x, hypot(y, z));
}
public static double code(double x, double y, double z) {
return Math.hypot(x, Math.hypot(y, z));
}
def code(x, y, z): return math.hypot(x, math.hypot(y, z))
function code(x, y, z) return hypot(x, hypot(y, z)) end
function tmp = code(x, y, z) tmp = hypot(x, hypot(y, z)); end
code[x_, y_, z_] := N[Sqrt[x ^ 2 + N[Sqrt[y ^ 2 + z ^ 2], $MachinePrecision] ^ 2], $MachinePrecision]
\begin{array}{l}
\\
\mathsf{hypot}\left(x, \mathsf{hypot}\left(y, z\right)\right)
\end{array}
herbie shell --seed 2024219
(FPCore (x y z)
:name "bug366 (missed optimization)"
:precision binary64
:alt
(! :herbie-platform default (hypot x (hypot y z)))
(sqrt (+ (* x x) (+ (* y y) (* z z)))))