
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 12 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
(FPCore (a1 a2 th) :precision binary64 (* (/ (fma a1 a1 (* a2 a2)) (sqrt 2.0)) (cos th)))
double code(double a1, double a2, double th) {
return (fma(a1, a1, (a2 * a2)) / sqrt(2.0)) * cos(th);
}
function code(a1, a2, th) return Float64(Float64(fma(a1, a1, Float64(a2 * a2)) / sqrt(2.0)) * cos(th)) end
code[a1_, a2_, th_] := N[(N[(N[(a1 * a1 + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision] * N[Cos[th], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right)}{\sqrt{2}} \cdot \cos th
\end{array}
Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
(FPCore (a1 a2 th)
:precision binary64
(let* ((t_1 (/ (cos th) (sqrt 2.0))))
(if (<= (+ (* t_1 (* a1 a1)) (* (* a2 a2) t_1)) -5e-118)
(* (* a2 a2) (/ (fma (* th th) -0.5 1.0) (sqrt 2.0)))
(/ (fma a2 a2 (* a1 a1)) (sqrt 2.0)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
double tmp;
if (((t_1 * (a1 * a1)) + ((a2 * a2) * t_1)) <= -5e-118) {
tmp = (a2 * a2) * (fma((th * th), -0.5, 1.0) / sqrt(2.0));
} else {
tmp = fma(a2, a2, (a1 * a1)) / sqrt(2.0);
}
return tmp;
}
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) tmp = 0.0 if (Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(Float64(a2 * a2) * t_1)) <= -5e-118) tmp = Float64(Float64(a2 * a2) * Float64(fma(Float64(th * th), -0.5, 1.0) / sqrt(2.0))); else tmp = Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0)); end return tmp end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(N[(a2 * a2), $MachinePrecision] * t$95$1), $MachinePrecision]), $MachinePrecision], -5e-118], N[(N[(a2 * a2), $MachinePrecision] * N[(N[(N[(th * th), $MachinePrecision] * -0.5 + 1.0), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
\mathbf{if}\;t\_1 \cdot \left(a1 \cdot a1\right) + \left(a2 \cdot a2\right) \cdot t\_1 \leq -5 \cdot 10^{-118}:\\
\;\;\;\;\left(a2 \cdot a2\right) \cdot \frac{\mathsf{fma}\left(th \cdot th, -0.5, 1\right)}{\sqrt{2}}\\
\mathbf{else}:\\
\;\;\;\;\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}\\
\end{array}
\end{array}
if (+.f64 (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a1 a1)) (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a2 a2))) < -5.00000000000000015e-118Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
*-commutativeN/A
lower-*.f64N/A
lift-*.f64N/A
lower-fma.f6499.6
Applied rewrites99.6%
Taylor expanded in th around 0
+-commutativeN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
sub-negN/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f640.2
Applied rewrites0.2%
Taylor expanded in th around 0
Applied rewrites55.3%
Taylor expanded in a1 around 0
unpow2N/A
lower-*.f6440.6
Applied rewrites40.6%
if -5.00000000000000015e-118 < (+.f64 (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a1 a1)) (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a2 a2))) Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
Taylor expanded in th around 0
lower-/.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6484.8
Applied rewrites84.8%
Final simplification76.7%
(FPCore (a1 a2 th)
:precision binary64
(let* ((t_1 (/ (cos th) (sqrt 2.0))))
(if (<= (+ (* t_1 (* a1 a1)) (* (* a2 a2) t_1)) -1e-61)
(* (* a1 a1) (/ (fma (* th th) -0.5 1.0) (sqrt 2.0)))
(/ (fma a2 a2 (* a1 a1)) (sqrt 2.0)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
double tmp;
if (((t_1 * (a1 * a1)) + ((a2 * a2) * t_1)) <= -1e-61) {
tmp = (a1 * a1) * (fma((th * th), -0.5, 1.0) / sqrt(2.0));
} else {
tmp = fma(a2, a2, (a1 * a1)) / sqrt(2.0);
}
return tmp;
}
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) tmp = 0.0 if (Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(Float64(a2 * a2) * t_1)) <= -1e-61) tmp = Float64(Float64(a1 * a1) * Float64(fma(Float64(th * th), -0.5, 1.0) / sqrt(2.0))); else tmp = Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0)); end return tmp end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(N[(a2 * a2), $MachinePrecision] * t$95$1), $MachinePrecision]), $MachinePrecision], -1e-61], N[(N[(a1 * a1), $MachinePrecision] * N[(N[(N[(th * th), $MachinePrecision] * -0.5 + 1.0), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
\mathbf{if}\;t\_1 \cdot \left(a1 \cdot a1\right) + \left(a2 \cdot a2\right) \cdot t\_1 \leq -1 \cdot 10^{-61}:\\
\;\;\;\;\left(a1 \cdot a1\right) \cdot \frac{\mathsf{fma}\left(th \cdot th, -0.5, 1\right)}{\sqrt{2}}\\
\mathbf{else}:\\
\;\;\;\;\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}\\
\end{array}
\end{array}
if (+.f64 (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a1 a1)) (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a2 a2))) < -1e-61Initial program 99.7%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
*-commutativeN/A
lower-*.f64N/A
lift-*.f64N/A
lower-fma.f6499.7
Applied rewrites99.7%
Taylor expanded in th around 0
+-commutativeN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
sub-negN/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f64N/A
unpow2N/A
lower-*.f640.2
Applied rewrites0.2%
Taylor expanded in th around 0
Applied rewrites58.8%
Taylor expanded in a1 around inf
unpow2N/A
lower-*.f6447.7
Applied rewrites47.7%
if -1e-61 < (+.f64 (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a1 a1)) (*.f64 (/.f64 (cos.f64 th) (sqrt.f64 #s(literal 2 binary64))) (*.f64 a2 a2))) Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
Taylor expanded in th around 0
lower-/.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6483.6
Applied rewrites83.6%
Final simplification77.5%
(FPCore (a1 a2 th)
:precision binary64
(if (<= (cos th) -0.02)
(/
(fma (* a1 a1) (- (sqrt 2.0)) (* a2 (* a2 (sqrt 2.0))))
(- (* (sqrt 2.0) (sqrt 2.0))))
(fma a1 (/ a1 (sqrt 2.0)) (/ 1.0 (/ (sqrt 2.0) (* a2 a2))))))
double code(double a1, double a2, double th) {
double tmp;
if (cos(th) <= -0.02) {
tmp = fma((a1 * a1), -sqrt(2.0), (a2 * (a2 * sqrt(2.0)))) / -(sqrt(2.0) * sqrt(2.0));
} else {
tmp = fma(a1, (a1 / sqrt(2.0)), (1.0 / (sqrt(2.0) / (a2 * a2))));
}
return tmp;
}
function code(a1, a2, th) tmp = 0.0 if (cos(th) <= -0.02) tmp = Float64(fma(Float64(a1 * a1), Float64(-sqrt(2.0)), Float64(a2 * Float64(a2 * sqrt(2.0)))) / Float64(-Float64(sqrt(2.0) * sqrt(2.0)))); else tmp = fma(a1, Float64(a1 / sqrt(2.0)), Float64(1.0 / Float64(sqrt(2.0) / Float64(a2 * a2)))); end return tmp end
code[a1_, a2_, th_] := If[LessEqual[N[Cos[th], $MachinePrecision], -0.02], N[(N[(N[(a1 * a1), $MachinePrecision] * (-N[Sqrt[2.0], $MachinePrecision]) + N[(a2 * N[(a2 * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] / (-N[(N[Sqrt[2.0], $MachinePrecision] * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision])), $MachinePrecision], N[(a1 * N[(a1 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision] + N[(1.0 / N[(N[Sqrt[2.0], $MachinePrecision] / N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\cos th \leq -0.02:\\
\;\;\;\;\frac{\mathsf{fma}\left(a1 \cdot a1, -\sqrt{2}, a2 \cdot \left(a2 \cdot \sqrt{2}\right)\right)}{-\sqrt{2} \cdot \sqrt{2}}\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(a1, \frac{a1}{\sqrt{2}}, \frac{1}{\frac{\sqrt{2}}{a2 \cdot a2}}\right)\\
\end{array}
\end{array}
if (cos.f64 th) < -0.0200000000000000004Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6411.2
Applied rewrites11.2%
lift-sqrt.f64N/A
associate-*r/N/A
lift-*.f64N/A
lift-*.f64N/A
lift-sqrt.f64N/A
frac-2negN/A
frac-addN/A
lower-/.f64N/A
lower-fma.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f6411.2
Applied rewrites11.2%
Applied rewrites0.6%
Applied rewrites36.6%
if -0.0200000000000000004 < (cos.f64 th) Initial program 99.7%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6486.3
Applied rewrites86.3%
lift-*.f64N/A
lift-sqrt.f64N/A
clear-numN/A
lower-/.f64N/A
lower-/.f6486.3
Applied rewrites86.3%
Final simplification75.1%
(FPCore (a1 a2 th)
:precision binary64
(if (<= (cos th) -0.02)
(/
(fma (* a1 a1) (- (sqrt 2.0)) (* (* a2 a2) (sqrt 2.0)))
(- (* (sqrt 2.0) (sqrt 2.0))))
(fma a1 (/ a1 (sqrt 2.0)) (/ 1.0 (/ (sqrt 2.0) (* a2 a2))))))
double code(double a1, double a2, double th) {
double tmp;
if (cos(th) <= -0.02) {
tmp = fma((a1 * a1), -sqrt(2.0), ((a2 * a2) * sqrt(2.0))) / -(sqrt(2.0) * sqrt(2.0));
} else {
tmp = fma(a1, (a1 / sqrt(2.0)), (1.0 / (sqrt(2.0) / (a2 * a2))));
}
return tmp;
}
function code(a1, a2, th) tmp = 0.0 if (cos(th) <= -0.02) tmp = Float64(fma(Float64(a1 * a1), Float64(-sqrt(2.0)), Float64(Float64(a2 * a2) * sqrt(2.0))) / Float64(-Float64(sqrt(2.0) * sqrt(2.0)))); else tmp = fma(a1, Float64(a1 / sqrt(2.0)), Float64(1.0 / Float64(sqrt(2.0) / Float64(a2 * a2)))); end return tmp end
code[a1_, a2_, th_] := If[LessEqual[N[Cos[th], $MachinePrecision], -0.02], N[(N[(N[(a1 * a1), $MachinePrecision] * (-N[Sqrt[2.0], $MachinePrecision]) + N[(N[(a2 * a2), $MachinePrecision] * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] / (-N[(N[Sqrt[2.0], $MachinePrecision] * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision])), $MachinePrecision], N[(a1 * N[(a1 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision] + N[(1.0 / N[(N[Sqrt[2.0], $MachinePrecision] / N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\cos th \leq -0.02:\\
\;\;\;\;\frac{\mathsf{fma}\left(a1 \cdot a1, -\sqrt{2}, \left(a2 \cdot a2\right) \cdot \sqrt{2}\right)}{-\sqrt{2} \cdot \sqrt{2}}\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(a1, \frac{a1}{\sqrt{2}}, \frac{1}{\frac{\sqrt{2}}{a2 \cdot a2}}\right)\\
\end{array}
\end{array}
if (cos.f64 th) < -0.0200000000000000004Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6411.2
Applied rewrites11.2%
lift-sqrt.f64N/A
associate-*r/N/A
lift-*.f64N/A
lift-*.f64N/A
lift-sqrt.f64N/A
frac-2negN/A
frac-addN/A
lower-/.f64N/A
lower-fma.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f6411.2
Applied rewrites11.2%
Applied rewrites0.6%
Applied rewrites36.6%
if -0.0200000000000000004 < (cos.f64 th) Initial program 99.7%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6486.3
Applied rewrites86.3%
lift-*.f64N/A
lift-sqrt.f64N/A
clear-numN/A
lower-/.f64N/A
lower-/.f6486.3
Applied rewrites86.3%
Final simplification75.1%
(FPCore (a1 a2 th) :precision binary64 (if (<= (cos th) -0.02) (* (fma (sqrt 2.0) (* a2 a2) (- (* a1 (* a1 (sqrt 2.0))))) -0.5) (fma a1 (/ a1 (sqrt 2.0)) (/ 1.0 (/ (sqrt 2.0) (* a2 a2))))))
double code(double a1, double a2, double th) {
double tmp;
if (cos(th) <= -0.02) {
tmp = fma(sqrt(2.0), (a2 * a2), -(a1 * (a1 * sqrt(2.0)))) * -0.5;
} else {
tmp = fma(a1, (a1 / sqrt(2.0)), (1.0 / (sqrt(2.0) / (a2 * a2))));
}
return tmp;
}
function code(a1, a2, th) tmp = 0.0 if (cos(th) <= -0.02) tmp = Float64(fma(sqrt(2.0), Float64(a2 * a2), Float64(-Float64(a1 * Float64(a1 * sqrt(2.0))))) * -0.5); else tmp = fma(a1, Float64(a1 / sqrt(2.0)), Float64(1.0 / Float64(sqrt(2.0) / Float64(a2 * a2)))); end return tmp end
code[a1_, a2_, th_] := If[LessEqual[N[Cos[th], $MachinePrecision], -0.02], N[(N[(N[Sqrt[2.0], $MachinePrecision] * N[(a2 * a2), $MachinePrecision] + (-N[(a1 * N[(a1 * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision])), $MachinePrecision] * -0.5), $MachinePrecision], N[(a1 * N[(a1 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision] + N[(1.0 / N[(N[Sqrt[2.0], $MachinePrecision] / N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\cos th \leq -0.02:\\
\;\;\;\;\mathsf{fma}\left(\sqrt{2}, a2 \cdot a2, -a1 \cdot \left(a1 \cdot \sqrt{2}\right)\right) \cdot -0.5\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(a1, \frac{a1}{\sqrt{2}}, \frac{1}{\frac{\sqrt{2}}{a2 \cdot a2}}\right)\\
\end{array}
\end{array}
if (cos.f64 th) < -0.0200000000000000004Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6411.2
Applied rewrites11.2%
lift-sqrt.f64N/A
associate-*r/N/A
lift-*.f64N/A
lift-*.f64N/A
lift-sqrt.f64N/A
frac-2negN/A
frac-addN/A
lower-/.f64N/A
lower-fma.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f6411.2
Applied rewrites11.2%
Applied rewrites0.6%
Applied rewrites36.6%
if -0.0200000000000000004 < (cos.f64 th) Initial program 99.7%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6486.3
Applied rewrites86.3%
lift-*.f64N/A
lift-sqrt.f64N/A
clear-numN/A
lower-/.f64N/A
lower-/.f6486.3
Applied rewrites86.3%
Final simplification75.1%
(FPCore (a1 a2 th) :precision binary64 (if (<= (cos th) -0.02) (* (fma (sqrt 2.0) (* a2 a2) (- (* a1 (* a1 (sqrt 2.0))))) -0.5) (/ (fma a2 a2 (* a1 a1)) (sqrt 2.0))))
double code(double a1, double a2, double th) {
double tmp;
if (cos(th) <= -0.02) {
tmp = fma(sqrt(2.0), (a2 * a2), -(a1 * (a1 * sqrt(2.0)))) * -0.5;
} else {
tmp = fma(a2, a2, (a1 * a1)) / sqrt(2.0);
}
return tmp;
}
function code(a1, a2, th) tmp = 0.0 if (cos(th) <= -0.02) tmp = Float64(fma(sqrt(2.0), Float64(a2 * a2), Float64(-Float64(a1 * Float64(a1 * sqrt(2.0))))) * -0.5); else tmp = Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0)); end return tmp end
code[a1_, a2_, th_] := If[LessEqual[N[Cos[th], $MachinePrecision], -0.02], N[(N[(N[Sqrt[2.0], $MachinePrecision] * N[(a2 * a2), $MachinePrecision] + (-N[(a1 * N[(a1 * N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision])), $MachinePrecision] * -0.5), $MachinePrecision], N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\cos th \leq -0.02:\\
\;\;\;\;\mathsf{fma}\left(\sqrt{2}, a2 \cdot a2, -a1 \cdot \left(a1 \cdot \sqrt{2}\right)\right) \cdot -0.5\\
\mathbf{else}:\\
\;\;\;\;\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}\\
\end{array}
\end{array}
if (cos.f64 th) < -0.0200000000000000004Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6411.2
Applied rewrites11.2%
lift-sqrt.f64N/A
associate-*r/N/A
lift-*.f64N/A
lift-*.f64N/A
lift-sqrt.f64N/A
frac-2negN/A
frac-addN/A
lower-/.f64N/A
lower-fma.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f64N/A
lower-*.f64N/A
lower-neg.f6411.2
Applied rewrites11.2%
Applied rewrites0.6%
Applied rewrites36.6%
if -0.0200000000000000004 < (cos.f64 th) Initial program 99.7%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
Taylor expanded in th around 0
lower-/.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6486.3
Applied rewrites86.3%
Final simplification75.1%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ (* a2 a2) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return cos(th) * ((a2 * a2) / sqrt(2.0));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * ((a2 * a2) / sqrt(2.0d0))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * ((a2 * a2) / Math.sqrt(2.0));
}
def code(a1, a2, th): return math.cos(th) * ((a2 * a2) / math.sqrt(2.0))
function code(a1, a2, th) return Float64(cos(th) * Float64(Float64(a2 * a2) / sqrt(2.0))) end
function tmp = code(a1, a2, th) tmp = cos(th) * ((a2 * a2) / sqrt(2.0)); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 * a2), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{a2 \cdot a2}{\sqrt{2}}
\end{array}
Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
Taylor expanded in a1 around 0
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6453.6
Applied rewrites53.6%
Final simplification53.6%
(FPCore (a1 a2 th) :precision binary64 (* (* a2 a2) (/ (cos th) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return (a2 * a2) * (cos(th) / sqrt(2.0));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = (a2 * a2) * (cos(th) / sqrt(2.0d0))
end function
public static double code(double a1, double a2, double th) {
return (a2 * a2) * (Math.cos(th) / Math.sqrt(2.0));
}
def code(a1, a2, th): return (a2 * a2) * (math.cos(th) / math.sqrt(2.0))
function code(a1, a2, th) return Float64(Float64(a2 * a2) * Float64(cos(th) / sqrt(2.0))) end
function tmp = code(a1, a2, th) tmp = (a2 * a2) * (cos(th) / sqrt(2.0)); end
code[a1_, a2_, th_] := N[(N[(a2 * a2), $MachinePrecision] * N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(a2 \cdot a2\right) \cdot \frac{\cos th}{\sqrt{2}}
\end{array}
Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
*-commutativeN/A
lower-*.f64N/A
lift-*.f64N/A
lower-fma.f6499.6
Applied rewrites99.6%
Taylor expanded in a1 around 0
unpow2N/A
lower-*.f6453.6
Applied rewrites53.6%
(FPCore (a1 a2 th) :precision binary64 (/ (fma a2 a2 (* a1 a1)) (sqrt 2.0)))
double code(double a1, double a2, double th) {
return fma(a2, a2, (a1 * a1)) / sqrt(2.0);
}
function code(a1, a2, th) return Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0)) end
code[a1_, a2_, th_] := N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}
\end{array}
Initial program 99.6%
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-cos.f64N/A
lift-sqrt.f64N/A
lift-/.f64N/A
lift-*.f64N/A
distribute-lft-outN/A
lift-/.f64N/A
div-invN/A
associate-*l*N/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites99.7%
Taylor expanded in th around 0
lower-/.f64N/A
+-commutativeN/A
unpow2N/A
lower-fma.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6469.3
Applied rewrites69.3%
(FPCore (a1 a2 th) :precision binary64 (/ (* a2 a2) (sqrt 2.0)))
double code(double a1, double a2, double th) {
return (a2 * a2) / sqrt(2.0);
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = (a2 * a2) / sqrt(2.0d0)
end function
public static double code(double a1, double a2, double th) {
return (a2 * a2) / Math.sqrt(2.0);
}
def code(a1, a2, th): return (a2 * a2) / math.sqrt(2.0)
function code(a1, a2, th) return Float64(Float64(a2 * a2) / sqrt(2.0)) end
function tmp = code(a1, a2, th) tmp = (a2 * a2) / sqrt(2.0); end
code[a1_, a2_, th_] := N[(N[(a2 * a2), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\frac{a2 \cdot a2}{\sqrt{2}}
\end{array}
Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6469.3
Applied rewrites69.3%
Taylor expanded in a1 around 0
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6438.9
Applied rewrites38.9%
(FPCore (a1 a2 th) :precision binary64 (* a1 (/ a1 (sqrt 2.0))))
double code(double a1, double a2, double th) {
return a1 * (a1 / sqrt(2.0));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = a1 * (a1 / sqrt(2.0d0))
end function
public static double code(double a1, double a2, double th) {
return a1 * (a1 / Math.sqrt(2.0));
}
def code(a1, a2, th): return a1 * (a1 / math.sqrt(2.0))
function code(a1, a2, th) return Float64(a1 * Float64(a1 / sqrt(2.0))) end
function tmp = code(a1, a2, th) tmp = a1 * (a1 / sqrt(2.0)); end
code[a1_, a2_, th_] := N[(a1 * N[(a1 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
a1 \cdot \frac{a1}{\sqrt{2}}
\end{array}
Initial program 99.6%
Taylor expanded in th around 0
unpow2N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6469.3
Applied rewrites69.3%
Taylor expanded in a1 around inf
lower-/.f64N/A
unpow2N/A
lower-*.f64N/A
lower-sqrt.f6443.4
Applied rewrites43.4%
lift-sqrt.f64N/A
associate-/l*N/A
*-commutativeN/A
lower-*.f64N/A
lower-/.f6443.4
Applied rewrites43.4%
Final simplification43.4%
herbie shell --seed 2024219
(FPCore (a1 a2 th)
:name "Migdal et al, Equation (64)"
:precision binary64
(+ (* (/ (cos th) (sqrt 2.0)) (* a1 a1)) (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))