
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
/* Real part of the square of the complex number re + i*im: re*re - im*im. */
double re_sqr(double re, double im) {
    const double re_squared = re * re;
    const double im_squared = im * im;
    return re_squared - im_squared;
}
!> Real part of the square of the complex number re + i*im.
!! Returns re*re - im*im.
real(8) function re_sqr(re, im)
    implicit none
    real(8), intent (in) :: re  !< real component
    real(8), intent (in) :: im  !< imaginary component
    re_sqr = (re * re) - (im * im)
end function re_sqr
/**
 * Real part of the square of the complex number {@code re + i*im}.
 *
 * @param re real component
 * @param im imaginary component
 * @return {@code re*re - im*im}
 */
public static double re_sqr(double re, double im) {
    final double reSquared = re * re;
    final double imSquared = im * im;
    return reSquared - imSquared;
}
def re_sqr(re, im):
    """Return re*re - im*im, the real part of (re + i*im) squared."""
    re_squared = re * re
    im_squared = im * im
    return re_squared - im_squared
# Real part of (re + i*im)^2: re*re - im*im, with each step converted to Float64.
function re_sqr(re, im)
    re_squared = Float64(re * re)
    im_squared = Float64(im * im)
    return Float64(re_squared - im_squared)
end
function tmp = re_sqr(re, im)
    % RE_SQR  Real part of (re + i*im)^2, computed as re*re - im*im.
    re_squared = re * re;
    im_squared = im * im;
    tmp = re_squared - im_squared;
end
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 4 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
/*
 * Initial program: re*re - im*im, the real part of the square of the
 * complex number re + i*im, evaluated in double precision.
 */
double re_sqr(double re, double im) {
    double sq_re = re * re;
    double sq_im = im * im;
    double diff = sq_re - sq_im;
    return diff;
}
!> Initial program: real part of the square of re + i*im.
!! The result is re*re - im*im.
function re_sqr(re, im) result(res)
    implicit none
    real(8), intent (in) :: re  !< real component
    real(8), intent (in) :: im  !< imaginary component
    real(8) :: res
    res = (re * re) - (im * im)
end function re_sqr
/**
 * Initial program: computes {@code re*re - im*im}.
 *
 * @param re real component
 * @param im imaginary component
 * @return the difference of the two squares
 */
public static double re_sqr(double re, double im) {
    double sqRe = re * re;
    double sqIm = im * im;
    double difference = sqRe - sqIm;
    return difference;
}
def re_sqr(re, im):
    """Initial program: difference of squares re*re - im*im."""
    sq_re, sq_im = re * re, im * im
    return sq_re - sq_im
# Initial program: re*re - im*im, with every intermediate converted to Float64.
function re_sqr(re, im)
    sq_re = Float64(re * re)
    sq_im = Float64(im * im)
    difference = Float64(sq_re - sq_im)
    return difference
end
function tmp = re_sqr(re, im)
    % RE_SQR  Initial program: difference of squares re*re - im*im.
    sq_re = re * re;
    sq_im = im * im;
    tmp = sq_re - sq_im;
end
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 5e+252) (fma re_m re_m (* im_m (- im_m))) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
double tmp;
if ((re_m * re_m) <= 5e+252) {
tmp = fma(re_m, re_m, (im_m * -im_m));
} else {
tmp = re_m * (re_m + (im_m * -2.0));
}
return tmp;
}
# Branching alternative for re*re - im*im.
# Inputs are expected to be magnitudes: re_m = abs(re), im_m = abs(im).
function re_sqr(re_m, im_m)
    # Small-square regime: difference of squares through one fused multiply-add.
    if Float64(re_m * re_m) <= 5e+252
        return fma(re_m, re_m, Float64(im_m * Float64(-im_m)))
    end
    # Otherwise use the re_m * (re_m - 2*im_m) form.
    return Float64(re_m * Float64(re_m + Float64(im_m * -2.0)))
end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 5e+252], N[(re$95$m * re$95$m + N[(im$95$m * (-im$95$m)), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re\_m \cdot re\_m \leq 5 \cdot 10^{+252}:\\
\;\;\;\;\mathsf{fma}\left(re\_m, re\_m, im\_m \cdot \left(-im\_m\right)\right)\\
\mathbf{else}:\\
\;\;\;\;re\_m \cdot \left(re\_m + im\_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 4.9999999999999997e252
Initial program 100.0%
sqr-neg 100.0%
cancel-sign-sub 100.0%
fma-def 100.0%
Simplified 100.0%
if 4.9999999999999997e252 < (*.f64 re re)
Initial program 76.4%
difference-of-squares 100.0%
add-sqr-sqrt 54.2%
sqrt-prod 79.2%
sqr-neg 79.2%
sqrt-unprod 34.7%
add-sqr-sqrt 83.3%
sub-neg 83.3%
pow1 83.3%
pow1 83.3%
pow-prod-up 83.3%
add-sqr-sqrt 40.2%
add-sqr-sqrt 25.0%
difference-of-squares 25.0%
metadata-eval 25.0%
unpow-prod-down 25.0%
Applied egg-rr 25.0%
unpow2 25.0%
unpow2 25.0%
unswap-sqr 25.0%
difference-of-squares 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 25.0%
metadata-eval 25.0%
unpow1 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 25.0%
metadata-eval 25.0%
unpow1 25.0%
difference-of-squares 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 48.6%
metadata-eval 48.6%
unpow1 48.6%
Simplified 83.3%
Taylor expanded in re around inf 72.2%
associate-*r* 72.2%
unpow2 72.2%
distribute-rgt-out 88.9%
*-commutative 88.9%
Simplified 88.9%
Final simplification 96.9%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 5e+252) (- (* re_m re_m) (* im_m im_m)) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Branching alternative for re*re - im*im without fused multiply-add.
 * The lines preceding this function define re_m = fabs(re), im_m = fabs(im).
 *
 * re_m*re_m <= 5e+252 : plain difference of squares.
 * otherwise           : re_m * (re_m - 2*im_m).
 */
double re_sqr(double re_m, double im_m) {
    const double re_squared = re_m * re_m;
    if (re_squared <= 5e+252) {
        return re_squared - (im_m * im_m);
    }
    return re_m * (re_m + (im_m * -2.0));
}
re_m = abs(re)
im_m = abs(im)
!> Branching alternative for re*re - im*im.
!! The lines preceding this function define re_m = abs(re), im_m = abs(im).
!! While re_m*re_m does not exceed the threshold the plain difference of
!! squares is returned; otherwise re_m * (re_m - 2*im_m) is used.
real(8) function re_sqr(re_m, im_m)
    implicit none
    real(8), intent (in) :: re_m  !< magnitude of the real component
    real(8), intent (in) :: im_m  !< magnitude of the imaginary component
    !> Largest re_m*re_m for which the direct formula is used.
    real(8), parameter :: square_limit = 5d+252
    if ((re_m * re_m) <= square_limit) then
        re_sqr = (re_m * re_m) - (im_m * im_m)
    else
        re_sqr = re_m * (re_m + (im_m * (-2.0d0)))
    end if
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Branching alternative for {@code re*re - im*im}.
 * The lines preceding this method define {@code re_m = Math.abs(re)} and
 * {@code im_m = Math.abs(im)}.
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return the difference of squares while {@code re_m*re_m <= 5e+252},
 *         otherwise {@code re_m * (re_m - 2*im_m)}
 */
public static double re_sqr(double re_m, double im_m) {
    final double reSquared = re_m * re_m;
    return (reSquared <= 5e+252)
            ? reSquared - (im_m * im_m)
            : re_m * (re_m + (im_m * -2.0));
}
# Inputs are expected to be magnitudes: re_m = math.fabs(re), im_m = math.fabs(im).
def re_sqr(re_m, im_m):
    """Branching alternative for re*re - im*im.

    Returns the plain difference of squares while re_m*re_m <= 5e+252,
    otherwise re_m * (re_m - 2*im_m).
    """
    if (re_m * re_m) <= 5e+252:
        return (re_m * re_m) - (im_m * im_m)
    return re_m * (re_m + (im_m * -2.0))
# Branching alternative for re*re - im*im (no fused multiply-add).
# Inputs are expected to be magnitudes: re_m = abs(re), im_m = abs(im).
function re_sqr(re_m, im_m)
    re_squared = Float64(re_m * re_m)
    if re_squared <= 5e+252
        return Float64(re_squared - Float64(im_m * im_m))
    end
    return Float64(re_m * Float64(re_m + Float64(im_m * -2.0)))
end
function tmp_2 = re_sqr(re_m, im_m)
    % RE_SQR  Branching alternative for re*re - im*im.
    %   Inputs are expected to be magnitudes: re_m = abs(re); im_m = abs(im);
    %   Returns the plain difference of squares while re_m*re_m <= 5e+252,
    %   otherwise re_m * (re_m - 2*im_m).
    if ((re_m * re_m) <= 5e+252)
        tmp_2 = (re_m * re_m) - (im_m * im_m);
    else
        tmp_2 = re_m * (re_m + (im_m * -2.0));
    end
end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 5e+252], N[(N[(re$95$m * re$95$m), $MachinePrecision] - N[(im$95$m * im$95$m), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re\_m \cdot re\_m \leq 5 \cdot 10^{+252}:\\
\;\;\;\;re\_m \cdot re\_m - im\_m \cdot im\_m\\
\mathbf{else}:\\
\;\;\;\;re\_m \cdot \left(re\_m + im\_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 4.9999999999999997e252
Initial program 100.0%
if 4.9999999999999997e252 < (*.f64 re re)
Initial program 76.4%
difference-of-squares 100.0%
add-sqr-sqrt 54.2%
sqrt-prod 79.2%
sqr-neg 79.2%
sqrt-unprod 34.7%
add-sqr-sqrt 83.3%
sub-neg 83.3%
pow1 83.3%
pow1 83.3%
pow-prod-up 83.3%
add-sqr-sqrt 40.2%
add-sqr-sqrt 25.0%
difference-of-squares 25.0%
metadata-eval 25.0%
unpow-prod-down 25.0%
Applied egg-rr 25.0%
unpow2 25.0%
unpow2 25.0%
unswap-sqr 25.0%
difference-of-squares 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 25.0%
metadata-eval 25.0%
unpow1 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 25.0%
metadata-eval 25.0%
unpow1 25.0%
difference-of-squares 25.0%
unpow1/2 25.0%
unpow1/2 25.0%
pow-sqr 48.6%
metadata-eval 48.6%
unpow1 48.6%
Simplified 83.3%
Taylor expanded in re around inf 72.2%
associate-*r* 72.2%
unpow2 72.2%
distribute-rgt-out 88.9%
*-commutative 88.9%
Simplified 88.9%
Final simplification 96.9%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* re_m (+ re_m (* im_m -2.0))))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Branch-free alternative: re_m * (re_m - 2*im_m).
 * The lines preceding this function define re_m = fabs(re), im_m = fabs(im).
 */
double re_sqr(double re_m, double im_m) {
    const double shifted = re_m + (im_m * -2.0);
    return re_m * shifted;
}
re_m = abs(re)
im_m = abs(im)
!> Branch-free alternative: re_m * (re_m - 2*im_m).
!! The lines preceding this function define re_m = abs(re), im_m = abs(im).
real(8) function re_sqr(re_m, im_m)
    implicit none
    real(8), intent (in) :: re_m  !< magnitude of the real component
    real(8), intent (in) :: im_m  !< magnitude of the imaginary component
    re_sqr = re_m * (re_m + (im_m * (-2.0d0)))
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Branch-free alternative: {@code re_m * (re_m - 2*im_m)}.
 * The lines preceding this method define {@code re_m = Math.abs(re)} and
 * {@code im_m = Math.abs(im)}.
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return {@code re_m * (re_m + im_m * -2.0)}
 */
public static double re_sqr(double re_m, double im_m) {
    final double shifted = re_m + (im_m * -2.0);
    return re_m * shifted;
}
# Inputs are expected to be magnitudes: re_m = math.fabs(re), im_m = math.fabs(im).
def re_sqr(re_m, im_m):
    """Branch-free alternative: re_m * (re_m - 2*im_m)."""
    return re_m * (re_m + (im_m * -2.0))
# Branch-free alternative: re_m * (re_m - 2*im_m).
# Inputs are expected to be magnitudes: re_m = abs(re), im_m = abs(im).
function re_sqr(re_m, im_m)
    return Float64(re_m * Float64(re_m + Float64(im_m * -2.0)))
end
function tmp = re_sqr(re_m, im_m)
    % RE_SQR  Branch-free alternative: re_m * (re_m - 2*im_m).
    %   Inputs are expected to be magnitudes: re_m = abs(re); im_m = abs(im);
    tmp = re_m * (re_m + (im_m * -2.0));
end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
re\_m \cdot \left(re\_m + im\_m \cdot -2\right)
\end{array}
Initial program 93.4%
difference-of-squares 100.0%
add-sqr-sqrt 51.1%
sqrt-prod 73.1%
sqr-neg 73.1%
sqrt-unprod 24.7%
add-sqr-sqrt 52.2%
sub-neg 52.2%
pow1 52.2%
pow1 52.2%
pow-prod-up 52.2%
add-sqr-sqrt 27.7%
add-sqr-sqrt 15.2%
difference-of-squares 15.2%
metadata-eval 15.2%
unpow-prod-down 15.2%
Applied egg-rr 15.2%
unpow2 15.2%
unpow2 15.2%
unswap-sqr 15.2%
difference-of-squares 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 15.2%
metadata-eval 15.2%
unpow1 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 15.2%
metadata-eval 15.2%
unpow1 15.2%
difference-of-squares 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 27.5%
metadata-eval 27.5%
unpow1 27.5%
Simplified 52.2%
Taylor expanded in re around inf 50.7%
associate-*r* 50.7%
unpow2 50.7%
distribute-rgt-out 55.4%
*-commutative 55.4%
Simplified 55.4%
Final simplification 55.4%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* re_m (* im_m -2.0)))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Lowest-accuracy alternative: re_m * (-2 * im_m).
 * The lines preceding this function define re_m = fabs(re), im_m = fabs(im).
 */
double re_sqr(double re_m, double im_m) {
    const double neg_twice_im = im_m * -2.0;
    return re_m * neg_twice_im;
}
re_m = abs(re)
im_m = abs(im)
!> Lowest-accuracy alternative: re_m * (-2 * im_m).
!! The lines preceding this function define re_m = abs(re), im_m = abs(im).
real(8) function re_sqr(re_m, im_m)
    implicit none
    real(8), intent (in) :: re_m  !< magnitude of the real component
    real(8), intent (in) :: im_m  !< magnitude of the imaginary component
    re_sqr = re_m * (im_m * (-2.0d0))
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Lowest-accuracy alternative: {@code re_m * (-2 * im_m)}.
 * The lines preceding this method define {@code re_m = Math.abs(re)} and
 * {@code im_m = Math.abs(im)}.
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return {@code re_m * (im_m * -2.0)}
 */
public static double re_sqr(double re_m, double im_m) {
    final double negTwiceIm = im_m * -2.0;
    return re_m * negTwiceIm;
}
# Inputs are expected to be magnitudes: re_m = math.fabs(re), im_m = math.fabs(im).
def re_sqr(re_m, im_m):
    """Lowest-accuracy alternative: re_m * (-2 * im_m)."""
    return re_m * (im_m * -2.0)
# Lowest-accuracy alternative: re_m * (-2 * im_m).
# Inputs are expected to be magnitudes: re_m = abs(re), im_m = abs(im).
function re_sqr(re_m, im_m)
    return Float64(re_m * Float64(im_m * -2.0))
end
function tmp = re_sqr(re_m, im_m)
    % RE_SQR  Lowest-accuracy alternative: re_m * (-2 * im_m).
    %   Inputs are expected to be magnitudes: re_m = abs(re); im_m = abs(im);
    tmp = re_m * (im_m * -2.0);
end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(re$95$m * N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
re\_m \cdot \left(im\_m \cdot -2\right)
\end{array}
Initial program 93.4%
difference-of-squares 100.0%
add-sqr-sqrt 51.1%
sqrt-prod 73.1%
sqr-neg 73.1%
sqrt-unprod 24.7%
add-sqr-sqrt 52.2%
sub-neg 52.2%
pow1 52.2%
pow1 52.2%
pow-prod-up 52.2%
add-sqr-sqrt 27.7%
add-sqr-sqrt 15.2%
difference-of-squares 15.2%
metadata-eval 15.2%
unpow-prod-down 15.2%
Applied egg-rr 15.2%
unpow2 15.2%
unpow2 15.2%
unswap-sqr 15.2%
difference-of-squares 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 15.2%
metadata-eval 15.2%
unpow1 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 15.2%
metadata-eval 15.2%
unpow1 15.2%
difference-of-squares 15.2%
unpow1/2 15.2%
unpow1/2 15.2%
pow-sqr 27.5%
metadata-eval 27.5%
unpow1 27.5%
Simplified 52.2%
Taylor expanded in re around inf 50.7%
associate-*r* 50.7%
unpow2 50.7%
distribute-rgt-out 55.4%
*-commutative 55.4%
Simplified 55.4%
Taylor expanded in re around 0 16.6%
*-commutative 16.6%
*-commutative 16.6%
associate-*r* 16.6%
*-commutative 16.6%
Simplified 16.6%
Final simplification 16.6%
herbie shell --seed 2024027
(FPCore re_sqr (re im)
:name "math.square on complex, real part"
:precision binary64
(- (* re re) (* im im)))