
; Real part of the square of the complex number re + im*i: re*re - im*im,
; evaluated in binary64.
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
/*
 * Real part of the square of the complex number re + im*i,
 * computed directly as re*re - im*im in double precision.
 */
double re_sqr(double re, double im) {
	return re * re - im * im;
}
!> Real part of the square of the complex number re + im*i: re**2 - im**2.
!! Uses the portable real64 kind instead of the compiler-specific real(8).
pure function re_sqr(re, im) result(res)
    use, intrinsic :: iso_fortran_env, only: dp => real64
    implicit none
    real(dp), intent(in) :: re  !< real component
    real(dp), intent(in) :: im  !< imaginary component
    real(dp) :: res
    res = (re * re) - (im * im)
end function re_sqr
/**
 * Real part of the square of the complex number {@code re + im*i}.
 *
 * @param re real component
 * @param im imaginary component
 * @return {@code re*re - im*im}
 */
public static double re_sqr(double re, double im) {
	return re * re - im * im;
}
def re_sqr(re, im):
    """Return ``re*re - im*im``, the real part of ``(re + im*1j)**2``."""
    re_squared = re * re
    im_squared = im * im
    return re_squared - im_squared
"""
    re_sqr(re, im)

Real part of the square of `re + im*i`: `re*re - im*im`, with every
intermediate result converted to `Float64`.
"""
function re_sqr(re, im)
    re_squared = Float64(re * re)
    im_squared = Float64(im * im)
    return Float64(re_squared - im_squared)
end
function result = re_sqr(re, im)
    % RE_SQR Real part of the square of re + im*i: re*re - im*im.
    result = re * re - im * im;
end
(* Real part of the square of re + I*im: re*re - im*im. Every operation is wrapped in N[..., $MachinePrecision]. *)
(* NOTE(review): "$95$" in the name is presumably an encoded underscore (re_sqr) -- confirm. *)
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 4 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Initial program as listed among the alternatives: re*re - im*im in binary64
; (the real part of the square of re + im*i).
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
/*
 * Initial program: real part of the square of re + im*i,
 * evaluated as re*re - im*im in double precision.
 */
double re_sqr(double re, double im) {
	return re * re - im * im;
}
!> Initial program: real part of the square of re + im*i, re**2 - im**2.
!! Uses the portable real64 kind instead of the compiler-specific real(8).
pure function re_sqr(re, im) result(res)
    use, intrinsic :: iso_fortran_env, only: dp => real64
    implicit none
    real(dp), intent(in) :: re  !< real component
    real(dp), intent(in) :: im  !< imaginary component
    real(dp) :: res
    res = (re * re) - (im * im)
end function re_sqr
/**
 * Initial program: real part of the square of {@code re + im*i}.
 *
 * @param re real component
 * @param im imaginary component
 * @return {@code re*re - im*im}
 */
public static double re_sqr(double re, double im) {
	return re * re - im * im;
}
def re_sqr(re, im):
    """Initial program: return ``re*re - im*im`` (real part of ``(re + im*1j)**2``)."""
    re_squared = re * re
    im_squared = im * im
    return re_squared - im_squared
"""
    re_sqr(re, im)

Initial program: `re*re - im*im`, with each intermediate result
converted to `Float64`.
"""
function re_sqr(re, im)
    re_squared = Float64(re * re)
    im_squared = Float64(im * im)
    return Float64(re_squared - im_squared)
end
function result = re_sqr(re, im)
    % RE_SQR Initial program: re*re - im*im (real part of (re + im*i)^2).
    result = re * re - im * im;
end
(* Initial program: re*re - im*im, with every operation wrapped in N[..., $MachinePrecision]. *)
(* NOTE(review): "$95$" in the name is presumably an encoded underscore (re_sqr) -- confirm. *)
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
; Herbie alternative on the magnitudes re_m = |re|, im_m = |im|:
; fma(re_m, re_m, im_m * (-im_m)) when re_m*re_m <= 1e+252,
; otherwise re_m * (re_m + im_m * -2).
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 1e+252) (fma re_m re_m (* im_m (- im_m))) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
double tmp;
if ((re_m * re_m) <= 1e+252) {
tmp = fma(re_m, re_m, (im_m * -im_m));
} else {
tmp = re_m * (re_m + (im_m * -2.0));
}
return tmp;
}
# Herbie alternative (Julia rendering; the line appears collapsed, with the
# re_m = abs(re), im_m = abs(im) preprocessing fused in front of the function).
# Returns fma(re_m, re_m, im_m * (-im_m)) when re_m*re_m <= 1e+252,
# otherwise re_m * (re_m + im_m * -2.0).
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) tmp = 0.0 if (Float64(re_m * re_m) <= 1e+252) tmp = fma(re_m, re_m, Float64(im_m * Float64(-im_m))); else tmp = Float64(re_m * Float64(re_m + Float64(im_m * -2.0))); end return tmp end
(* Herbie alternative on the magnitudes of re and im: re_m*re_m + im_m*(-im_m) when re_m*re_m <= 1e+252, otherwise re_m*(re_m + im_m * -2.0). *)
(* NOTE(review): "$95$" in identifiers is presumably an encoded underscore -- confirm. *)
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 1e+252], N[(re$95$m * re$95$m + N[(im$95$m * (-im$95$m)), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re_m \cdot re_m \leq 10^{+252}:\\
\;\;\;\;\mathsf{fma}\left(re_m, re_m, im_m \cdot \left(-im_m\right)\right)\\
\mathbf{else}:\\
\;\;\;\;re_m \cdot \left(re_m + im_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 1.0000000000000001e252:
Initial program: 100.0%
sqr-neg: 100.0%
cancel-sign-sub: 100.0%
fma-def: 100.0%
Simplified: 100.0%
if 1.0000000000000001e252 < (*.f64 re re):
Initial program: 75.0%
difference-of-squares: 100.0%
add-sqr-sqrt: 54.2%
sqrt-prod: 88.9%
sqr-neg: 88.9%
sqrt-unprod: 41.7%
add-sqr-sqrt: 84.7%
sub-neg: 84.7%
pow1: 84.7%
pow1: 84.7%
pow-prod-up: 84.7%
add-sqr-sqrt: 42.9%
add-sqr-sqrt: 18.0%
difference-of-squares: 18.0%
metadata-eval: 18.0%
unpow-prod-down: 18.0%
Applied egg-rr: 18.0%
unpow2: 18.0%
unpow2: 18.0%
unswap-sqr: 18.0%
difference-of-squares: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 18.0%
metadata-eval: 18.0%
unpow1: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 18.0%
metadata-eval: 18.0%
unpow1: 18.0%
difference-of-squares: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 43.1%
metadata-eval: 43.1%
unpow1: 43.1%
Simplified: 84.7%
Taylor expanded in re around inf: 73.6%
associate-*r*: 73.6%
unpow2: 73.6%
distribute-rgt-out: 94.4%
*-commutative: 94.4%
Simplified: 94.4%
Final simplification: 98.4%
; Herbie alternative on the magnitudes re_m = |re|, im_m = |im|:
; re_m*re_m - im_m*im_m when re_m*re_m <= 1e+252,
; otherwise re_m * (re_m + im_m * -2).
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 1e+252) (- (* re_m re_m) (* im_m im_m)) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Herbie alternative with two regimes; the arguments are the magnitudes
 * of the original inputs (re_m = fabs(re), im_m = fabs(im)).
 *
 * When re_m*re_m <= 1e+252 the plain difference of squares is returned;
 * every other input (including a NaN product) takes the form
 * re_m * (re_m + im_m * -2.0).
 */
double re_sqr(double re_m, double im_m) {
	if (re_m * re_m <= 1e+252) {
		return re_m * re_m - im_m * im_m;
	}
	return re_m * (re_m + im_m * -2.0);
}
re_m = abs(re)
im_m = abs(im)
!> Herbie alternative with two regimes, taking the magnitudes of the
!! original inputs (re_m = abs(re), im_m = abs(im)).
!!
!! Returns re_m**2 - im_m**2 when re_m*re_m <= 1e252, otherwise
!! re_m * (re_m + im_m * (-2)). Uses the portable real64 kind instead of
!! the compiler-specific real(8).
pure function re_sqr(re_m, im_m) result(res)
    use, intrinsic :: iso_fortran_env, only: dp => real64
    implicit none
    real(dp), intent(in) :: re_m  !< magnitude of the real component
    real(dp), intent(in) :: im_m  !< magnitude of the imaginary component
    real(dp) :: res
    ! Regime boundary on re_m*re_m reported by Herbie.
    real(dp), parameter :: re_sq_limit = 1.0e252_dp

    if ((re_m * re_m) <= re_sq_limit) then
        res = (re_m * re_m) - (im_m * im_m)
    else
        res = re_m * (re_m + (im_m * (-2.0_dp)))
    end if
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Herbie alternative with two regimes, taking the magnitudes of the
 * original inputs ({@code re_m = Math.abs(re)}, {@code im_m = Math.abs(im)}).
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return {@code re_m*re_m - im_m*im_m} when {@code re_m*re_m <= 1e+252},
 *         otherwise {@code re_m * (re_m + im_m * -2.0)}
 */
public static double re_sqr(double re_m, double im_m) {
	return (re_m * re_m <= 1e+252)
		? re_m * re_m - im_m * im_m
		: re_m * (re_m + im_m * -2.0);
}
# Herbie alternative (Python rendering; the line appears collapsed, with the
# re_m = math.fabs(re), im_m = math.fabs(im) preprocessing fused in front).
# Returns re_m*re_m - im_m*im_m when re_m*re_m <= 1e+252,
# otherwise re_m * (re_m + im_m * -2.0).
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): tmp = 0 if (re_m * re_m) <= 1e+252: tmp = (re_m * re_m) - (im_m * im_m) else: tmp = re_m * (re_m + (im_m * -2.0)) return tmp
# Herbie alternative (Julia rendering; the line appears collapsed, with the
# re_m = abs(re), im_m = abs(im) preprocessing fused in front of the function).
# Returns re_m*re_m - im_m*im_m when re_m*re_m <= 1e+252,
# otherwise re_m * (re_m + im_m * -2.0).
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) tmp = 0.0 if (Float64(re_m * re_m) <= 1e+252) tmp = Float64(Float64(re_m * re_m) - Float64(im_m * im_m)); else tmp = Float64(re_m * Float64(re_m + Float64(im_m * -2.0))); end return tmp end
% Herbie alternative (MATLAB rendering; the line appears collapsed, with the
% re_m = abs(re), im_m = abs(im) preprocessing fused in front of the function).
% Returns re_m*re_m - im_m*im_m when re_m*re_m <= 1e+252,
% otherwise re_m * (re_m + im_m * -2.0).
re_m = abs(re); im_m = abs(im); function tmp_2 = re_sqr(re_m, im_m) tmp = 0.0; if ((re_m * re_m) <= 1e+252) tmp = (re_m * re_m) - (im_m * im_m); else tmp = re_m * (re_m + (im_m * -2.0)); end tmp_2 = tmp; end
(* Herbie alternative on the magnitudes of re and im: re_m*re_m - im_m*im_m when re_m*re_m <= 1e+252, otherwise re_m*(re_m + im_m * -2.0). *)
(* NOTE(review): "$95$" in identifiers is presumably an encoded underscore -- confirm. *)
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 1e+252], N[(N[(re$95$m * re$95$m), $MachinePrecision] - N[(im$95$m * im$95$m), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re_m \cdot re_m \leq 10^{+252}:\\
\;\;\;\;re_m \cdot re_m - im_m \cdot im_m\\
\mathbf{else}:\\
\;\;\;\;re_m \cdot \left(re_m + im_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 1.0000000000000001e252:
Initial program: 100.0%
if 1.0000000000000001e252 < (*.f64 re re):
Initial program: 75.0%
difference-of-squares: 100.0%
add-sqr-sqrt: 54.2%
sqrt-prod: 88.9%
sqr-neg: 88.9%
sqrt-unprod: 41.7%
add-sqr-sqrt: 84.7%
sub-neg: 84.7%
pow1: 84.7%
pow1: 84.7%
pow-prod-up: 84.7%
add-sqr-sqrt: 42.9%
add-sqr-sqrt: 18.0%
difference-of-squares: 18.0%
metadata-eval: 18.0%
unpow-prod-down: 18.0%
Applied egg-rr: 18.0%
unpow2: 18.0%
unpow2: 18.0%
unswap-sqr: 18.0%
difference-of-squares: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 18.0%
metadata-eval: 18.0%
unpow1: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 18.0%
metadata-eval: 18.0%
unpow1: 18.0%
difference-of-squares: 18.0%
unpow1/2: 18.0%
unpow1/2: 18.0%
pow-sqr: 43.1%
metadata-eval: 43.1%
unpow1: 43.1%
Simplified: 84.7%
Taylor expanded in re around inf: 73.6%
associate-*r*: 73.6%
unpow2: 73.6%
distribute-rgt-out: 94.4%
*-commutative: 94.4%
Simplified: 94.4%
Final simplification: 98.4%
; Branch-free Herbie alternative on the magnitudes re_m = |re|, im_m = |im|:
; re_m * (re_m + im_m * -2).
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* re_m (+ re_m (* im_m -2.0))))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Branch-free Herbie alternative; the arguments are the magnitudes of the
 * original inputs (re_m = fabs(re), im_m = fabs(im)).
 * Returns re_m * (re_m + im_m * -2.0).
 */
double re_sqr(double re_m, double im_m) {
	return re_m * (re_m + im_m * -2.0);
}
re_m = abs(re)
im_m = abs(im)
!> Branch-free Herbie alternative, taking the magnitudes of the original
!! inputs (re_m = abs(re), im_m = abs(im)): re_m * (re_m + im_m * (-2)).
!! Uses the portable real64 kind instead of the compiler-specific real(8).
pure function re_sqr(re_m, im_m) result(res)
    use, intrinsic :: iso_fortran_env, only: dp => real64
    implicit none
    real(dp), intent(in) :: re_m  !< magnitude of the real component
    real(dp), intent(in) :: im_m  !< magnitude of the imaginary component
    real(dp) :: res
    res = re_m * (re_m + (im_m * (-2.0_dp)))
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Branch-free Herbie alternative, taking the magnitudes of the original
 * inputs ({@code re_m = Math.abs(re)}, {@code im_m = Math.abs(im)}).
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return {@code re_m * (re_m + im_m * -2.0)}
 */
public static double re_sqr(double re_m, double im_m) {
	return re_m * (re_m + im_m * -2.0);
}
# Branch-free Herbie alternative (Python rendering; the line appears collapsed,
# with the re_m = math.fabs(re), im_m = math.fabs(im) preprocessing fused in front).
# Returns re_m * (re_m + im_m * -2.0).
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): return re_m * (re_m + (im_m * -2.0))
# Branch-free Herbie alternative (Julia rendering; the line appears collapsed,
# with the re_m = abs(re), im_m = abs(im) preprocessing fused in front).
# Returns re_m * (re_m + im_m * -2.0), each step converted to Float64.
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) return Float64(re_m * Float64(re_m + Float64(im_m * -2.0))) end
% Branch-free Herbie alternative (MATLAB rendering; the line appears collapsed,
% with the re_m = abs(re), im_m = abs(im) preprocessing fused in front).
% Returns re_m * (re_m + im_m * -2.0).
re_m = abs(re); im_m = abs(im); function tmp = re_sqr(re_m, im_m) tmp = re_m * (re_m + (im_m * -2.0)); end
(* Branch-free Herbie alternative on the magnitudes of re and im: re_m*(re_m + im_m * -2.0). *)
(* NOTE(review): "$95$" in identifiers is presumably an encoded underscore -- confirm. *)
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
re_m \cdot \left(re_m + im_m \cdot -2\right)
\end{array}
Initial program: 93.0%
difference-of-squares: 100.0%
add-sqr-sqrt: 53.4%
sqrt-prod: 79.1%
sqr-neg: 79.1%
sqrt-unprod: 27.6%
add-sqr-sqrt: 56.6%
sub-neg: 56.6%
pow1: 56.6%
pow1: 56.6%
pow-prod-up: 56.6%
add-sqr-sqrt: 31.1%
add-sqr-sqrt: 15.4%
difference-of-squares: 15.4%
metadata-eval: 15.4%
unpow-prod-down: 15.4%
Applied egg-rr: 15.4%
unpow2: 15.4%
unpow2: 15.4%
unswap-sqr: 15.4%
difference-of-squares: 15.4%
unpow1/2: 15.4%
unpow1/2: 15.4%
pow-sqr: 15.5%
metadata-eval: 15.5%
unpow1: 15.5%
unpow1/2: 15.5%
unpow1/2: 15.5%
pow-sqr: 15.5%
metadata-eval: 15.5%
unpow1: 15.5%
difference-of-squares: 15.5%
unpow1/2: 15.5%
unpow1/2: 15.5%
pow-sqr: 29.0%
metadata-eval: 29.0%
unpow1: 29.0%
Simplified: 56.6%
Taylor expanded in re around inf: 56.0%
associate-*r*: 56.0%
unpow2: 56.0%
distribute-rgt-out: 61.8%
*-commutative: 61.8%
Simplified: 61.8%
Final simplification: 61.8%
; Herbie alternative on the magnitudes re_m = |re|, im_m = |im|:
; -2 * (re_m * im_m).
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* -2.0 (* re_m im_m)))
re_m = fabs(re);
im_m = fabs(im);
/*
 * Herbie alternative; the arguments are the magnitudes of the original
 * inputs (re_m = fabs(re), im_m = fabs(im)).
 * Returns -2.0 * (re_m * im_m).
 */
double re_sqr(double re_m, double im_m) {
	const double product = re_m * im_m;
	return -2.0 * product;
}
re_m = abs(re)
im_m = abs(im)
!> Herbie alternative, taking the magnitudes of the original inputs
!! (re_m = abs(re), im_m = abs(im)): (-2) * (re_m * im_m).
!! Uses the portable real64 kind instead of the compiler-specific real(8).
pure function re_sqr(re_m, im_m) result(res)
    use, intrinsic :: iso_fortran_env, only: dp => real64
    implicit none
    real(dp), intent(in) :: re_m  !< magnitude of the real component
    real(dp), intent(in) :: im_m  !< magnitude of the imaginary component
    real(dp) :: res
    res = (-2.0_dp) * (re_m * im_m)
end function re_sqr
re_m = Math.abs(re);
im_m = Math.abs(im);
/**
 * Herbie alternative, taking the magnitudes of the original inputs
 * ({@code re_m = Math.abs(re)}, {@code im_m = Math.abs(im)}).
 *
 * @param re_m magnitude of the real component
 * @param im_m magnitude of the imaginary component
 * @return {@code -2.0 * (re_m * im_m)}
 */
public static double re_sqr(double re_m, double im_m) {
	final double product = re_m * im_m;
	return -2.0 * product;
}
# Herbie alternative (Python rendering; the line appears collapsed, with the
# re_m = math.fabs(re), im_m = math.fabs(im) preprocessing fused in front).
# Returns -2.0 * (re_m * im_m).
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): return -2.0 * (re_m * im_m)
# Herbie alternative (Julia rendering; the line appears collapsed, with the
# re_m = abs(re), im_m = abs(im) preprocessing fused in front).
# Returns -2.0 * (re_m * im_m), each step converted to Float64.
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) return Float64(-2.0 * Float64(re_m * im_m)) end
% Herbie alternative (MATLAB rendering; the line appears collapsed, with the
% re_m = abs(re), im_m = abs(im) preprocessing fused in front).
% Returns -2.0 * (re_m * im_m).
re_m = abs(re); im_m = abs(im); function tmp = re_sqr(re_m, im_m) tmp = -2.0 * (re_m * im_m); end
(* Herbie alternative on the magnitudes of re and im: -2.0 * (re_m * im_m). *)
(* NOTE(review): "$95$" in identifiers is presumably an encoded underscore -- confirm. *)
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(-2.0 * N[(re$95$m * im$95$m), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
-2 \cdot \left(re_m \cdot im_m\right)
\end{array}
Initial program: 93.0%
difference-of-squares: 100.0%
add-sqr-sqrt: 53.4%
sqrt-prod: 79.1%
sqr-neg: 79.1%
sqrt-unprod: 27.6%
add-sqr-sqrt: 56.6%
sub-neg: 56.6%
pow1: 56.6%
pow1: 56.6%
pow-prod-up: 56.6%
add-sqr-sqrt: 31.1%
add-sqr-sqrt: 15.4%
difference-of-squares: 15.4%
metadata-eval: 15.4%
unpow-prod-down: 15.4%
Applied egg-rr: 15.4%
unpow2: 15.4%
unpow2: 15.4%
unswap-sqr: 15.4%
difference-of-squares: 15.4%
unpow1/2: 15.4%
unpow1/2: 15.4%
pow-sqr: 15.5%
metadata-eval: 15.5%
unpow1: 15.5%
unpow1/2: 15.5%
unpow1/2: 15.5%
pow-sqr: 15.5%
metadata-eval: 15.5%
unpow1: 15.5%
difference-of-squares: 15.5%
unpow1/2: 15.5%
unpow1/2: 15.5%
pow-sqr: 29.0%
metadata-eval: 29.0%
unpow1: 29.0%
Simplified: 56.6%
Taylor expanded in re around inf: 56.0%
associate-*r*: 56.0%
unpow2: 56.0%
distribute-rgt-out: 61.8%
*-commutative: 61.8%
Simplified: 61.8%
Taylor expanded in re around 0: 18.2%
Final simplification: 18.2%
herbie shell --seed 2024026
; Benchmark input for the Herbie run: the real part of the square of the
; complex number re + im*i, written as re*re - im*im in binary64.
(FPCore re_sqr (re im)
:name "math.square on complex, real part"
:precision binary64
(- (* re re) (* im im)))