
(FPCore (a b) :precision binary64 (sqrt (- (* a a) (* b b))))
double code(double a, double b) {
return sqrt(((a * a) - (b * b)));
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = sqrt(((a * a) - (b * b)))
end function
public static double code(double a, double b) {
return Math.sqrt(((a * a) - (b * b)));
}
def code(a, b): return math.sqrt(((a * a) - (b * b)))
function code(a, b) return sqrt(Float64(Float64(a * a) - Float64(b * b))) end
function tmp = code(a, b) tmp = sqrt(((a * a) - (b * b))); end
code[a_, b_] := N[Sqrt[N[(N[(a * a), $MachinePrecision] - N[(b * b), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{a \cdot a - b \cdot b}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 4 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a b) :precision binary64 (sqrt (- (* a a) (* b b))))
double code(double a, double b) {
return sqrt(((a * a) - (b * b)));
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = sqrt(((a * a) - (b * b)))
end function
public static double code(double a, double b) {
return Math.sqrt(((a * a) - (b * b)));
}
def code(a, b): return math.sqrt(((a * a) - (b * b)))
function code(a, b) return sqrt(Float64(Float64(a * a) - Float64(b * b))) end
function tmp = code(a, b) tmp = sqrt(((a * a) - (b * b))); end
code[a_, b_] := N[Sqrt[N[(N[(a * a), $MachinePrecision] - N[(b * b), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{a \cdot a - b \cdot b}
\end{array}
b_m = (fabs.f64 b) a_m = (fabs.f64 a) (FPCore (a_m b_m) :precision binary64 (* (+ b_m a_m) (sqrt (/ (- a_m b_m) (+ b_m a_m)))))
b_m = fabs(b);
a_m = fabs(a);
double code(double a_m, double b_m) {
return (b_m + a_m) * sqrt(((a_m - b_m) / (b_m + a_m)));
}
b_m = abs(b)
a_m = abs(a)
real(8) function code(a_m, b_m)
real(8), intent (in) :: a_m
real(8), intent (in) :: b_m
code = (b_m + a_m) * sqrt(((a_m - b_m) / (b_m + a_m)))
end function
b_m = Math.abs(b);
a_m = Math.abs(a);
public static double code(double a_m, double b_m) {
return (b_m + a_m) * Math.sqrt(((a_m - b_m) / (b_m + a_m)));
}
b_m = math.fabs(b) a_m = math.fabs(a) def code(a_m, b_m): return (b_m + a_m) * math.sqrt(((a_m - b_m) / (b_m + a_m)))
b_m = abs(b) a_m = abs(a) function code(a_m, b_m) return Float64(Float64(b_m + a_m) * sqrt(Float64(Float64(a_m - b_m) / Float64(b_m + a_m)))) end
b_m = abs(b); a_m = abs(a); function tmp = code(a_m, b_m) tmp = (b_m + a_m) * sqrt(((a_m - b_m) / (b_m + a_m))); end
b_m = N[Abs[b], $MachinePrecision] a_m = N[Abs[a], $MachinePrecision] code[a$95$m_, b$95$m_] := N[(N[(b$95$m + a$95$m), $MachinePrecision] * N[Sqrt[N[(N[(a$95$m - b$95$m), $MachinePrecision] / N[(b$95$m + a$95$m), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
b_m = \left|b\right|
\\
a_m = \left|a\right|
\\
\left(b\_m + a\_m\right) \cdot \sqrt{\frac{a\_m - b\_m}{b\_m + a\_m}}
\end{array}
Initial program 57.0%
lift-sqrt.f64N/A
pow1/2N/A
lift--.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
*-commutativeN/A
unpow-prod-downN/A
lower-*.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
lower--.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f6445.8
Applied rewrites45.8%
lift-sqrt.f64N/A
lift--.f64N/A
flip--N/A
difference-of-squaresN/A
+-commutativeN/A
lift-+.f64N/A
lift--.f64N/A
+-commutativeN/A
lift-+.f64N/A
associate-/l*N/A
sqrt-prodN/A
lift-sqrt.f64N/A
lower-*.f64N/A
lower-sqrt.f64N/A
lower-/.f6445.8
Applied rewrites45.8%
lift-*.f64N/A
*-commutativeN/A
lift-*.f64N/A
associate-*r*N/A
lift-sqrt.f64N/A
lift-sqrt.f64N/A
rem-square-sqrtN/A
lower-*.f6446.7
Applied rewrites46.7%
b_m = (fabs.f64 b) a_m = (fabs.f64 a) (FPCore (a_m b_m) :precision binary64 (* (sqrt (- a_m b_m)) (sqrt (+ b_m a_m))))
b_m = fabs(b);
a_m = fabs(a);
double code(double a_m, double b_m) {
return sqrt((a_m - b_m)) * sqrt((b_m + a_m));
}
b_m = abs(b)
a_m = abs(a)
real(8) function code(a_m, b_m)
real(8), intent (in) :: a_m
real(8), intent (in) :: b_m
code = sqrt((a_m - b_m)) * sqrt((b_m + a_m))
end function
b_m = Math.abs(b);
a_m = Math.abs(a);
public static double code(double a_m, double b_m) {
return Math.sqrt((a_m - b_m)) * Math.sqrt((b_m + a_m));
}
b_m = math.fabs(b) a_m = math.fabs(a) def code(a_m, b_m): return math.sqrt((a_m - b_m)) * math.sqrt((b_m + a_m))
b_m = abs(b) a_m = abs(a) function code(a_m, b_m) return Float64(sqrt(Float64(a_m - b_m)) * sqrt(Float64(b_m + a_m))) end
b_m = abs(b); a_m = abs(a); function tmp = code(a_m, b_m) tmp = sqrt((a_m - b_m)) * sqrt((b_m + a_m)); end
b_m = N[Abs[b], $MachinePrecision] a_m = N[Abs[a], $MachinePrecision] code[a$95$m_, b$95$m_] := N[(N[Sqrt[N[(a$95$m - b$95$m), $MachinePrecision]], $MachinePrecision] * N[Sqrt[N[(b$95$m + a$95$m), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
b_m = \left|b\right|
\\
a_m = \left|a\right|
\\
\sqrt{a\_m - b\_m} \cdot \sqrt{b\_m + a\_m}
\end{array}
Initial program 57.0%
lift-sqrt.f64N/A
pow1/2N/A
lift--.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
*-commutativeN/A
unpow-prod-downN/A
lower-*.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
lower--.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f6445.8
Applied rewrites45.8%
b_m = (fabs.f64 b) a_m = (fabs.f64 a) (FPCore (a_m b_m) :precision binary64 (fma (* (/ -0.5 a_m) b_m) b_m a_m))
b_m = fabs(b);
a_m = fabs(a);
double code(double a_m, double b_m) {
return fma(((-0.5 / a_m) * b_m), b_m, a_m);
}
b_m = abs(b) a_m = abs(a) function code(a_m, b_m) return fma(Float64(Float64(-0.5 / a_m) * b_m), b_m, a_m) end
b_m = N[Abs[b], $MachinePrecision] a_m = N[Abs[a], $MachinePrecision] code[a$95$m_, b$95$m_] := N[(N[(N[(-0.5 / a$95$m), $MachinePrecision] * b$95$m), $MachinePrecision] * b$95$m + a$95$m), $MachinePrecision]
\begin{array}{l}
b_m = \left|b\right|
\\
a_m = \left|a\right|
\\
\mathsf{fma}\left(\frac{-0.5}{a\_m} \cdot b\_m, b\_m, a\_m\right)
\end{array}
Initial program 57.0%
Taylor expanded in b around 0
+-commutativeN/A
associate-*r/N/A
associate-*l/N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
associate-*r/N/A
unpow2N/A
associate-*r*N/A
lower-fma.f64N/A
lower-*.f64N/A
associate-*r/N/A
metadata-evalN/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f6446.3
Applied rewrites46.3%
b_m = (fabs.f64 b) a_m = (fabs.f64 a) (FPCore (a_m b_m) :precision binary64 a_m)
b_m = fabs(b);
a_m = fabs(a);
double code(double a_m, double b_m) {
return a_m;
}
b_m = abs(b)
a_m = abs(a)
real(8) function code(a_m, b_m)
real(8), intent (in) :: a_m
real(8), intent (in) :: b_m
code = a_m
end function
b_m = Math.abs(b);
a_m = Math.abs(a);
public static double code(double a_m, double b_m) {
return a_m;
}
b_m = math.fabs(b) a_m = math.fabs(a) def code(a_m, b_m): return a_m
b_m = abs(b) a_m = abs(a) function code(a_m, b_m) return a_m end
b_m = abs(b); a_m = abs(a); function tmp = code(a_m, b_m) tmp = a_m; end
b_m = N[Abs[b], $MachinePrecision] a_m = N[Abs[a], $MachinePrecision] code[a$95$m_, b$95$m_] := a$95$m
\begin{array}{l}
b_m = \left|b\right|
\\
a_m = \left|a\right|
\\
a\_m
\end{array}
Initial program 57.0%
lift-sqrt.f64N/A
pow1/2N/A
lift--.f64N/A
lift-*.f64N/A
lift-*.f64N/A
difference-of-squaresN/A
*-commutativeN/A
unpow-prod-downN/A
lower-*.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
lower--.f64N/A
pow1/2N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f6445.8
Applied rewrites45.8%
Taylor expanded in a around inf
+-commutativeN/A
associate-*r/N/A
distribute-rgt1-inN/A
metadata-evalN/A
mul0-lftN/A
metadata-evalN/A
mul0-lftN/A
associate-*r/N/A
mul0-lftN/A
metadata-evalN/A
*-rgt-identity45.9
Applied rewrites45.9%
(FPCore (a b) :precision binary64 (* (sqrt (+ (fabs a) (fabs b))) (sqrt (- (fabs a) (fabs b)))))
double code(double a, double b) {
return sqrt((fabs(a) + fabs(b))) * sqrt((fabs(a) - fabs(b)));
}
real(8) function code(a, b)
real(8), intent (in) :: a
real(8), intent (in) :: b
code = sqrt((abs(a) + abs(b))) * sqrt((abs(a) - abs(b)))
end function
public static double code(double a, double b) {
return Math.sqrt((Math.abs(a) + Math.abs(b))) * Math.sqrt((Math.abs(a) - Math.abs(b)));
}
def code(a, b): return math.sqrt((math.fabs(a) + math.fabs(b))) * math.sqrt((math.fabs(a) - math.fabs(b)))
function code(a, b) return Float64(sqrt(Float64(abs(a) + abs(b))) * sqrt(Float64(abs(a) - abs(b)))) end
function tmp = code(a, b) tmp = sqrt((abs(a) + abs(b))) * sqrt((abs(a) - abs(b))); end
code[a_, b_] := N[(N[Sqrt[N[(N[Abs[a], $MachinePrecision] + N[Abs[b], $MachinePrecision]), $MachinePrecision]], $MachinePrecision] * N[Sqrt[N[(N[Abs[a], $MachinePrecision] - N[Abs[b], $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\sqrt{\left|a\right| + \left|b\right|} \cdot \sqrt{\left|a\right| - \left|b\right|}
\end{array}
herbie shell --seed 2024322
(FPCore (a b)
:name "bug366, discussion (missed optimization)"
:precision binary64
:alt
(! :herbie-platform default (let* ((fa (fabs a)) (fb (fabs b))) (* (sqrt (+ fa fb)) (sqrt (- fa fb)))))
(sqrt (- (* a a) (* b b))))