
; Binary64 FPCore over a and b: square root of (a * a) - (b * b).
(FPCore (a b) :precision binary64 (sqrt (- (* a a) (* b b))))
double code(double a, double b) {
return sqrt(((a * a) - (b * b)));
}
!> Returns sqrt(a*a - b*b) for real(8) arguments.
function code(a, b) result(root)
    implicit none
    real(8), intent(in) :: a, b   ! values whose squares are subtracted
    real(8) :: root               ! square root of a*a - b*b
    real(8) :: a_sq, b_sq         ! the two squares

    a_sq = a * a
    b_sq = b * b
    root = sqrt(a_sq - b_sq)
end function code
/**
 * Returns {@code Math.sqrt(a*a - b*b)}.
 *
 * @param a value whose square is the minuend
 * @param b value whose square is the subtrahend
 * @return the square root of {@code a*a - b*b}
 */
public static double code(double a, double b) {
    final double aSquared = a * a;
    final double bSquared = b * b;
    return Math.sqrt(aSquared - bSquared);
}
def code(a, b):
    """Return the square root of ``a*a - b*b``."""
    a_squared = a * a
    b_squared = b * b
    return math.sqrt(a_squared - b_squared)
# Square root of a*a - b*b; every intermediate result is converted to Float64.
function code(a, b)
    a_sq = Float64(a * a)
    b_sq = Float64(b * b)
    return sqrt(Float64(a_sq - b_sq))
end
function tmp = code(a, b)
    % Square root of a*a - b*b.
    a_sq = a * a;
    b_sq = b * b;
    tmp = sqrt(a_sq - b_sq);
end
(* code[a, b]: Sqrt of a*a - b*b; each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := N[Sqrt[N[(N[(a * a), $MachinePrecision] - N[(b * b), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{a \cdot a - b \cdot b}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 3 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Binary64 FPCore over a and b: square root of (a * a) - (b * b).
(FPCore (a b) :precision binary64 (sqrt (- (* a a) (* b b))))
double code(double a, double b) {
return sqrt(((a * a) - (b * b)));
}
!> Square root of the difference of squares, sqrt(a*a - b*b), in real(8).
function code(a, b) result(root)
    implicit none
    real(8), intent(in) :: a
    real(8), intent(in) :: b
    real(8) :: root         ! value returned to the caller
    real(8) :: difference   ! a*a - b*b before the square root

    difference = (a * a) - (b * b)
    root = sqrt(difference)
end function code
/**
 * Square root of the difference of squares.
 *
 * @param a first operand; contributes {@code a*a}
 * @param b second operand; contributes {@code b*b}
 * @return {@code Math.sqrt(a*a - b*b)}
 */
public static double code(double a, double b) {
    final double difference = (a * a) - (b * b);
    return Math.sqrt(difference);
}
def code(a, b):
    """Compute ``sqrt(a*a - b*b)`` with ``math.sqrt``."""
    difference = (a * a) - (b * b)
    return math.sqrt(difference)
# sqrt of (a*a - b*b), converting each intermediate to Float64 along the way.
function code(a, b)
    difference = Float64(Float64(a * a) - Float64(b * b))
    return sqrt(difference)
end
function tmp = code(a, b)
    % sqrt of the difference (a*a) - (b*b).
    difference = (a * a) - (b * b);
    tmp = sqrt(difference);
end
(* code[a, b]: Sqrt of a*a - b*b; each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := N[Sqrt[N[(N[(a * a), $MachinePrecision] - N[(b * b), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{a \cdot a - b \cdot b}
\end{array}
a_m = (fabs.f64 a)
; Binary64 FPCore over a_m and b: fma of ((-0.5 / a_m) * b), b and a_m.
(FPCore (a_m b) :precision binary64 (fma (* (/ -0.5 a_m) b) b a_m))
a_m = fabs(a);
double code(double a_m, double b) {
return fma(((-0.5 / a_m) * b), b, a_m);
}
a_m = abs(a)

# fma of ((-0.5 / a_m) * b), b and a_m; the intermediates are converted to Float64.
function code(a_m, b)
    return fma(Float64(Float64(-0.5 / a_m) * b), b, a_m)
end
a_m = N[Abs[a], $MachinePrecision]
(* code[a$95$m, b]: ((-0.5 / a$95$m) * b) * b + a$95$m, with intermediates wrapped in N[..., $MachinePrecision]. *)
code[a$95$m_, b_] := N[(N[(N[(-0.5 / a$95$m), $MachinePrecision] * b), $MachinePrecision] * b + a$95$m), $MachinePrecision]
\begin{array}{l}
a_m = \left|a\right|
\\
\mathsf{fma}\left(\frac{-0.5}{a\_m} \cdot b, b, a\_m\right)
\end{array}
Initial program 57.0%
Taylor expanded in b around 0
+-commutative N/A
associate-*r/ N/A
associate-*l/ N/A
metadata-eval N/A
distribute-neg-frac N/A
metadata-eval N/A
associate-*r/ N/A
unpow2 N/A
associate-*r* N/A
lower-fma.f64 N/A
lower-*.f64 N/A
associate-*r/ N/A
metadata-eval N/A
distribute-neg-frac N/A
metadata-eval N/A
lower-/.f64 48.3
Applied rewrites 48.3%
a_m = (fabs.f64 a)
; Binary64 FPCore over a_m and b: square root of a_m * a_m (b does not appear in the body).
(FPCore (a_m b) :precision binary64 (sqrt (* a_m a_m)))
a_m = fabs(a);
double code(double a_m, double b) {
return sqrt((a_m * a_m));
}
a_m = abs(a)
!> Returns sqrt(a_m * a_m); b is part of the interface but is not used.
function code(a_m, b) result(root)
    implicit none
    real(8), intent(in) :: a_m   ! value that is squared
    real(8), intent(in) :: b     ! unused
    real(8) :: root              ! square root of a_m * a_m
    real(8) :: squared

    squared = a_m * a_m
    root = sqrt(squared)
end function code
a_m = Math.abs(a);
/**
 * Returns {@code Math.sqrt(a_m * a_m)}.
 *
 * @param a_m value that is squared
 * @param b   accepted but not used
 * @return the square root of {@code a_m * a_m}
 */
public static double code(double a_m, double b) {
    final double squared = a_m * a_m;
    return Math.sqrt(squared);
}
a_m = math.fabs(a)


def code(a_m, b):
    """Return the square root of ``a_m * a_m``; ``b`` is accepted but unused."""
    return math.sqrt((a_m * a_m))
a_m = abs(a)

# Square root of a_m * a_m (product converted to Float64); b is accepted but unused.
function code(a_m, b)
    return sqrt(Float64(a_m * a_m))
end
a_m = abs(a);

function tmp = code(a_m, b)
    % Square root of a_m * a_m; b is accepted but unused.
    tmp = sqrt((a_m * a_m));
end
a_m = N[Abs[a], $MachinePrecision]
(* code[a$95$m, b]: Sqrt of a$95$m * a$95$m, with intermediates wrapped in N[..., $MachinePrecision]; b is unused. *)
code[a$95$m_, b_] := N[Sqrt[N[(a$95$m * a$95$m), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
a_m = \left|a\right|
\\
\sqrt{a\_m \cdot a\_m}
\end{array}
Initial program 57.0%
Taylor expanded in b around 0
unpow2 N/A
lower-*.f64 57.4
Applied rewrites 57.4%
a_m = (fabs.f64 a)
; Binary64 FPCore over a_m and b: the negation of a_m (b does not appear in the body).
; NOTE(review): with a_m = (fabs.f64 a) this value is never positive - confirm this is intended.
(FPCore (a_m b) :precision binary64 (- a_m))
a_m = fabs(a);
/*
 * Returns the negation of a_m; the parameter b is accepted but never read.
 * NOTE(review): the line before this function sets a_m = fabs(a), so the
 * result is never positive - confirm this is intended.
 */
double code(double a_m, double b) {
    const double negated = -a_m;
    return negated;
}
a_m = abs(a)
!> Returns the negation of a_m; b is part of the interface but is not used.
!> NOTE(review): the line before this function sets a_m = abs(a), so the
!> result is never positive - confirm this is intended.
function code(a_m, b) result(negated)
    implicit none
    real(8), intent(in) :: a_m   ! value to negate
    real(8), intent(in) :: b     ! unused
    real(8) :: negated           ! -a_m

    negated = -a_m
end function code
a_m = Math.abs(a);
/**
 * Returns the negation of {@code a_m}.
 *
 * <p>NOTE(review): the line before this method sets {@code a_m = Math.abs(a)},
 * so the result is never positive - confirm this is intended.
 *
 * @param a_m value to negate
 * @param b   accepted but not used
 * @return {@code -a_m}
 */
public static double code(double a_m, double b) {
    final double negated = -a_m;
    return negated;
}
a_m = math.fabs(a)


def code(a_m, b):
    """Return the negation of ``a_m``; ``b`` is accepted but unused."""
    # NOTE(review): with a_m = math.fabs(a) this is never positive - confirm intended.
    return -a_m
a_m = abs(a)

# Negation of a_m, converted to Float64; b is accepted but unused.
# NOTE(review): with a_m = abs(a) this is never positive - confirm intended.
function code(a_m, b)
    return Float64(-a_m)
end
a_m = abs(a);

function tmp = code(a_m, b)
    % Negation of a_m; b is accepted but unused.
    % NOTE(review): with a_m = abs(a) this is never positive - confirm intended.
    tmp = -a_m;
end
a_m = N[Abs[a], $MachinePrecision]
(* code[a$95$m, b]: the negation of a$95$m; b is unused. NOTE(review): with a_m = Abs[a] this is never positive - confirm intended. *)
code[a$95$m_, b_] := (-a$95$m)
\begin{array}{l}
a_m = \left|a\right|
\\
-a\_m
\end{array}
Initial program 57.0%
Taylor expanded in a around -inf
mul-1-neg N/A
lower-neg.f64 52.8
Applied rewrites 52.8%
; Binary64 FPCore over a and b: sqrt(|a| + |b|) multiplied by sqrt(|a| - |b|).
(FPCore (a b) :precision binary64 (* (sqrt (+ (fabs a) (fabs b))) (sqrt (- (fabs a) (fabs b)))))
double code(double a, double b) {
return sqrt((fabs(a) + fabs(b))) * sqrt((fabs(a) - fabs(b)));
}
!> Returns sqrt(|a| + |b|) * sqrt(|a| - |b|) for real(8) arguments.
function code(a, b) result(prod)
    implicit none
    real(8), intent(in) :: a, b
    real(8) :: prod               ! product of the two square roots
    real(8) :: abs_a, abs_b       ! absolute values of the arguments

    abs_a = abs(a)
    abs_b = abs(b)
    prod = sqrt(abs_a + abs_b) * sqrt(abs_a - abs_b)
end function code
/**
 * Returns {@code sqrt(|a| + |b|) * sqrt(|a| - |b|)}.
 *
 * @param a first operand; only its absolute value is used
 * @param b second operand; only its absolute value is used
 * @return the product of the two square roots
 */
public static double code(double a, double b) {
    final double absA = Math.abs(a);
    final double absB = Math.abs(b);
    final double sumRoot = Math.sqrt(absA + absB);
    final double diffRoot = Math.sqrt(absA - absB);
    return sumRoot * diffRoot;
}
def code(a, b):
    """Return ``sqrt(|a| + |b|) * sqrt(|a| - |b|)``."""
    abs_a = math.fabs(a)
    abs_b = math.fabs(b)
    sum_root = math.sqrt(abs_a + abs_b)
    diff_root = math.sqrt(abs_a - abs_b)
    return sum_root * diff_root
# sqrt(|a| + |b|) * sqrt(|a| - |b|), converting each intermediate to Float64.
function code(a, b)
    abs_a = abs(a)
    abs_b = abs(b)
    sum_root = sqrt(Float64(abs_a + abs_b))
    diff_root = sqrt(Float64(abs_a - abs_b))
    return Float64(sum_root * diff_root)
end
function tmp = code(a, b)
    % sqrt(|a| + |b|) * sqrt(|a| - |b|).
    abs_a = abs(a);
    abs_b = abs(b);
    tmp = sqrt(abs_a + abs_b) * sqrt(abs_a - abs_b);
end
(* code[a, b]: Sqrt[Abs[a] + Abs[b]] * Sqrt[Abs[a] - Abs[b]]; each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := N[(N[Sqrt[N[(N[Abs[a], $MachinePrecision] + N[Abs[b], $MachinePrecision]), $MachinePrecision]], $MachinePrecision] * N[Sqrt[N[(N[Abs[a], $MachinePrecision] - N[Abs[b], $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\sqrt{\left|a\right| + \left|b\right|} \cdot \sqrt{\left|a\right| - \left|b\right|}
\end{array}
herbie shell --seed 2024270
; Named binary64 core over a and b; its body is sqrt of (a * a) - (b * b).
(FPCore (a b)
:name "bug366, discussion (missed optimization)"
:precision binary64
; The :alt property carries a second formulation, sqrt(|a| + |b|) * sqrt(|a| - |b|),
; annotated with :herbie-platform default.
:alt
(! :herbie-platform default (let* ((fa (fabs a)) (fb (fabs b))) (* (sqrt (+ fa fb)) (sqrt (- fa fb)))))
; Body of the core.
(sqrt (- (* a a) (* b b))))