
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
double re_sqr(double re, double im) {
return (re * re) - (im * im);
}
real(8) function re_sqr(re, im)
real(8), intent (in) :: re
real(8), intent (in) :: im
re_sqr = (re * re) - (im * im)
end function
public static double re_sqr(double re, double im) {
return (re * re) - (im * im);
}
def re_sqr(re, im): return (re * re) - (im * im)
function re_sqr(re, im) return Float64(Float64(re * re) - Float64(im * im)) end
function tmp = re_sqr(re, im) tmp = (re * re) - (im * im); end
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 4 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore re_sqr (re im) :precision binary64 (- (* re re) (* im im)))
double re_sqr(double re, double im) {
return (re * re) - (im * im);
}
real(8) function re_sqr(re, im)
real(8), intent (in) :: re
real(8), intent (in) :: im
re_sqr = (re * re) - (im * im)
end function
public static double re_sqr(double re, double im) {
return (re * re) - (im * im);
}
def re_sqr(re, im): return (re * re) - (im * im)
function re_sqr(re, im) return Float64(Float64(re * re) - Float64(im * im)) end
function tmp = re_sqr(re, im) tmp = (re * re) - (im * im); end
re$95$sqr[re_, im_] := N[(N[(re * re), $MachinePrecision] - N[(im * im), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
re \cdot re - im \cdot im
\end{array}
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 3e+289) (fma re_m re_m (* im_m (- im_m))) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
double tmp;
if ((re_m * re_m) <= 3e+289) {
tmp = fma(re_m, re_m, (im_m * -im_m));
} else {
tmp = re_m * (re_m + (im_m * -2.0));
}
return tmp;
}
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) tmp = 0.0 if (Float64(re_m * re_m) <= 3e+289) tmp = fma(re_m, re_m, Float64(im_m * Float64(-im_m))); else tmp = Float64(re_m * Float64(re_m + Float64(im_m * -2.0))); end return tmp end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 3e+289], N[(re$95$m * re$95$m + N[(im$95$m * (-im$95$m)), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re_m \cdot re_m \leq 3 \cdot 10^{+289}:\\
\;\;\;\;\mathsf{fma}\left(re_m, re_m, im_m \cdot \left(-im_m\right)\right)\\
\mathbf{else}:\\
\;\;\;\;re_m \cdot \left(re_m + im_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 3.0000000000000002e289Initial program 100.0%
sqr-neg100.0%
cancel-sign-sub100.0%
fma-def100.0%
Simplified100.0%
if 3.0000000000000002e289 < (*.f64 re re) Initial program 78.6%
difference-of-squares100.0%
add-sqr-sqrt40.0%
sqrt-prod91.4%
sqr-neg91.4%
sqrt-unprod54.3%
add-sqr-sqrt90.0%
sub-neg90.0%
pow190.0%
pow190.0%
pow-prod-up90.0%
add-sqr-sqrt48.6%
add-sqr-sqrt17.1%
difference-of-squares17.1%
metadata-eval17.1%
unpow-prod-down17.1%
Applied egg-rr17.1%
unpow217.1%
unpow217.1%
unswap-sqr17.1%
difference-of-squares17.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr17.1%
metadata-eval17.1%
unpow117.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr17.1%
metadata-eval17.1%
unpow117.1%
difference-of-squares17.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr35.7%
metadata-eval35.7%
unpow135.7%
Simplified90.0%
Taylor expanded in re around inf 78.6%
associate-*r*78.6%
unpow278.6%
distribute-rgt-out97.1%
*-commutative97.1%
Simplified97.1%
Final simplification99.2%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (if (<= (* re_m re_m) 3e+289) (- (* re_m re_m) (* im_m im_m)) (* re_m (+ re_m (* im_m -2.0)))))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
double tmp;
if ((re_m * re_m) <= 3e+289) {
tmp = (re_m * re_m) - (im_m * im_m);
} else {
tmp = re_m * (re_m + (im_m * -2.0));
}
return tmp;
}
re_m = abs(re)
im_m = abs(im)
real(8) function re_sqr(re_m, im_m)
real(8), intent (in) :: re_m
real(8), intent (in) :: im_m
real(8) :: tmp
if ((re_m * re_m) <= 3d+289) then
tmp = (re_m * re_m) - (im_m * im_m)
else
tmp = re_m * (re_m + (im_m * (-2.0d0)))
end if
re_sqr = tmp
end function
re_m = Math.abs(re);
im_m = Math.abs(im);
public static double re_sqr(double re_m, double im_m) {
double tmp;
if ((re_m * re_m) <= 3e+289) {
tmp = (re_m * re_m) - (im_m * im_m);
} else {
tmp = re_m * (re_m + (im_m * -2.0));
}
return tmp;
}
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): tmp = 0 if (re_m * re_m) <= 3e+289: tmp = (re_m * re_m) - (im_m * im_m) else: tmp = re_m * (re_m + (im_m * -2.0)) return tmp
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) tmp = 0.0 if (Float64(re_m * re_m) <= 3e+289) tmp = Float64(Float64(re_m * re_m) - Float64(im_m * im_m)); else tmp = Float64(re_m * Float64(re_m + Float64(im_m * -2.0))); end return tmp end
re_m = abs(re); im_m = abs(im); function tmp_2 = re_sqr(re_m, im_m) tmp = 0.0; if ((re_m * re_m) <= 3e+289) tmp = (re_m * re_m) - (im_m * im_m); else tmp = re_m * (re_m + (im_m * -2.0)); end tmp_2 = tmp; end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := If[LessEqual[N[(re$95$m * re$95$m), $MachinePrecision], 3e+289], N[(N[(re$95$m * re$95$m), $MachinePrecision] - N[(im$95$m * im$95$m), $MachinePrecision]), $MachinePrecision], N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
\begin{array}{l}
\mathbf{if}\;re_m \cdot re_m \leq 3 \cdot 10^{+289}:\\
\;\;\;\;re_m \cdot re_m - im_m \cdot im_m\\
\mathbf{else}:\\
\;\;\;\;re_m \cdot \left(re_m + im_m \cdot -2\right)\\
\end{array}
\end{array}
if (*.f64 re re) < 3.0000000000000002e289Initial program 100.0%
if 3.0000000000000002e289 < (*.f64 re re) Initial program 78.6%
difference-of-squares100.0%
add-sqr-sqrt40.0%
sqrt-prod91.4%
sqr-neg91.4%
sqrt-unprod54.3%
add-sqr-sqrt90.0%
sub-neg90.0%
pow190.0%
pow190.0%
pow-prod-up90.0%
add-sqr-sqrt48.6%
add-sqr-sqrt17.1%
difference-of-squares17.1%
metadata-eval17.1%
unpow-prod-down17.1%
Applied egg-rr17.1%
unpow217.1%
unpow217.1%
unswap-sqr17.1%
difference-of-squares17.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr17.1%
metadata-eval17.1%
unpow117.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr17.1%
metadata-eval17.1%
unpow117.1%
difference-of-squares17.1%
unpow1/217.1%
unpow1/217.1%
pow-sqr35.7%
metadata-eval35.7%
unpow135.7%
Simplified90.0%
Taylor expanded in re around inf 78.6%
associate-*r*78.6%
unpow278.6%
distribute-rgt-out97.1%
*-commutative97.1%
Simplified97.1%
Final simplification99.2%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* re_m (+ re_m (* im_m -2.0))))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
return re_m * (re_m + (im_m * -2.0));
}
re_m = abs(re)
im_m = abs(im)
real(8) function re_sqr(re_m, im_m)
real(8), intent (in) :: re_m
real(8), intent (in) :: im_m
re_sqr = re_m * (re_m + (im_m * (-2.0d0)))
end function
re_m = Math.abs(re);
im_m = Math.abs(im);
public static double re_sqr(double re_m, double im_m) {
return re_m * (re_m + (im_m * -2.0));
}
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): return re_m * (re_m + (im_m * -2.0))
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) return Float64(re_m * Float64(re_m + Float64(im_m * -2.0))) end
re_m = abs(re); im_m = abs(im); function tmp = re_sqr(re_m, im_m) tmp = re_m * (re_m + (im_m * -2.0)); end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(re$95$m * N[(re$95$m + N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
re_m \cdot \left(re_m + im_m \cdot -2\right)
\end{array}
Initial program 94.1%
difference-of-squares100.0%
add-sqr-sqrt48.4%
sqrt-prod76.6%
sqr-neg76.6%
sqrt-unprod28.9%
add-sqr-sqrt52.1%
sub-neg52.1%
pow152.1%
pow152.1%
pow-prod-up52.1%
add-sqr-sqrt27.6%
add-sqr-sqrt12.1%
difference-of-squares12.1%
metadata-eval12.1%
unpow-prod-down12.1%
Applied egg-rr12.1%
unpow212.1%
unpow212.1%
unswap-sqr12.1%
difference-of-squares12.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr12.1%
metadata-eval12.1%
unpow112.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr12.1%
metadata-eval12.1%
unpow112.1%
difference-of-squares12.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr23.2%
metadata-eval23.2%
unpow123.2%
Simplified52.1%
Taylor expanded in re around inf 50.9%
associate-*r*50.9%
unpow250.9%
distribute-rgt-out55.9%
*-commutative55.9%
Simplified55.9%
Final simplification55.9%
re_m = (fabs.f64 re) im_m = (fabs.f64 im) (FPCore re_sqr (re_m im_m) :precision binary64 (* re_m (* im_m -2.0)))
re_m = fabs(re);
im_m = fabs(im);
double re_sqr(double re_m, double im_m) {
return re_m * (im_m * -2.0);
}
re_m = abs(re)
im_m = abs(im)
real(8) function re_sqr(re_m, im_m)
real(8), intent (in) :: re_m
real(8), intent (in) :: im_m
re_sqr = re_m * (im_m * (-2.0d0))
end function
re_m = Math.abs(re);
im_m = Math.abs(im);
public static double re_sqr(double re_m, double im_m) {
return re_m * (im_m * -2.0);
}
re_m = math.fabs(re) im_m = math.fabs(im) def re_sqr(re_m, im_m): return re_m * (im_m * -2.0)
re_m = abs(re) im_m = abs(im) function re_sqr(re_m, im_m) return Float64(re_m * Float64(im_m * -2.0)) end
re_m = abs(re); im_m = abs(im); function tmp = re_sqr(re_m, im_m) tmp = re_m * (im_m * -2.0); end
re_m = N[Abs[re], $MachinePrecision] im_m = N[Abs[im], $MachinePrecision] re$95$sqr[re$95$m_, im$95$m_] := N[(re$95$m * N[(im$95$m * -2.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
re_m = \left|re\right|
\\
im_m = \left|im\right|
\\
re_m \cdot \left(im_m \cdot -2\right)
\end{array}
Initial program 94.1%
difference-of-squares100.0%
add-sqr-sqrt48.4%
sqrt-prod76.6%
sqr-neg76.6%
sqrt-unprod28.9%
add-sqr-sqrt52.1%
sub-neg52.1%
pow152.1%
pow152.1%
pow-prod-up52.1%
add-sqr-sqrt27.6%
add-sqr-sqrt12.1%
difference-of-squares12.1%
metadata-eval12.1%
unpow-prod-down12.1%
Applied egg-rr12.1%
unpow212.1%
unpow212.1%
unswap-sqr12.1%
difference-of-squares12.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr12.1%
metadata-eval12.1%
unpow112.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr12.1%
metadata-eval12.1%
unpow112.1%
difference-of-squares12.1%
unpow1/212.1%
unpow1/212.1%
pow-sqr23.2%
metadata-eval23.2%
unpow123.2%
Simplified52.1%
Taylor expanded in re around inf 50.9%
associate-*r*50.9%
unpow250.9%
distribute-rgt-out55.9%
*-commutative55.9%
Simplified55.9%
Taylor expanded in re around 0 15.6%
*-commutative15.6%
*-commutative15.6%
associate-*r*15.6%
*-commutative15.6%
Simplified15.6%
Final simplification15.6%
herbie shell --seed 2024024
(FPCore re_sqr (re im)
:name "math.square on complex, real part"
:precision binary64
(- (* re re) (* im im)))