
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ (fma a2 a2 (* a1 a1)) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return cos(th) * (fma(a2, a2, (a1 * a1)) / sqrt(2.0));
}
function code(a1, a2, th) return Float64(cos(th) * Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0))) end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
cos-neg99.5%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
Final simplification99.6%
(FPCore (a1 a2 th) :precision binary64 (* (* (cos th) (sqrt 0.5)) (+ (* a1 a1) (* a2 a2))))
double code(double a1, double a2, double th) {
return (cos(th) * sqrt(0.5)) * ((a1 * a1) + (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = (cos(th) * sqrt(0.5d0)) * ((a1 * a1) + (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
return (Math.cos(th) * Math.sqrt(0.5)) * ((a1 * a1) + (a2 * a2));
}
def code(a1, a2, th): return (math.cos(th) * math.sqrt(0.5)) * ((a1 * a1) + (a2 * a2))
function code(a1, a2, th) return Float64(Float64(cos(th) * sqrt(0.5)) * Float64(Float64(a1 * a1) + Float64(a2 * a2))) end
function tmp = code(a1, a2, th) tmp = (cos(th) * sqrt(0.5)) * ((a1 * a1) + (a2 * a2)); end
code[a1_, a2_, th_] := N[(N[(N[Cos[th], $MachinePrecision] * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision] * N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(\cos th \cdot \sqrt{0.5}\right) \cdot \left(a1 \cdot a1 + a2 \cdot a2\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
Simplified99.5%
clear-num99.6%
associate-/r/99.5%
pow1/299.5%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Taylor expanded in th around inf 99.6%
*-commutative99.6%
Simplified99.6%
Final simplification99.6%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (* a2 (* a2 (pow 2.0 -0.5)))))
double code(double a1, double a2, double th) {
return cos(th) * (a2 * (a2 * pow(2.0, -0.5)));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * (a2 * (a2 * (2.0d0 ** (-0.5d0))))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * (a2 * (a2 * Math.pow(2.0, -0.5)));
}
def code(a1, a2, th): return math.cos(th) * (a2 * (a2 * math.pow(2.0, -0.5)))
function code(a1, a2, th) return Float64(cos(th) * Float64(a2 * Float64(a2 * (2.0 ^ -0.5)))) end
function tmp = code(a1, a2, th) tmp = cos(th) * (a2 * (a2 * (2.0 ^ -0.5))); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(a2 * N[(a2 * N[Power[2.0, -0.5], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \left(a2 \cdot \left(a2 \cdot {2}^{-0.5}\right)\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
cos-neg99.5%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
Taylor expanded in a2 around inf 60.1%
associate-*l/60.1%
Simplified60.1%
pow260.1%
div-inv60.0%
associate-*l*60.1%
pow1/260.1%
pow-flip60.1%
metadata-eval60.1%
Applied egg-rr60.1%
Final simplification60.1%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (* a2 (/ a2 (sqrt 2.0)))))
double code(double a1, double a2, double th) {
return cos(th) * (a2 * (a2 / sqrt(2.0)));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * (a2 * (a2 / sqrt(2.0d0)))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * (a2 * (a2 / Math.sqrt(2.0)));
}
def code(a1, a2, th): return math.cos(th) * (a2 * (a2 / math.sqrt(2.0)))
function code(a1, a2, th) return Float64(cos(th) * Float64(a2 * Float64(a2 / sqrt(2.0)))) end
function tmp = code(a1, a2, th) tmp = cos(th) * (a2 * (a2 / sqrt(2.0))); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(a2 * N[(a2 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \left(a2 \cdot \frac{a2}{\sqrt{2}}\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
cos-neg99.5%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
Taylor expanded in a2 around inf 60.1%
associate-*l/60.1%
Simplified60.1%
pow239.4%
associate-/l*39.5%
Applied egg-rr60.1%
Final simplification60.1%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ a2 (/ (sqrt 2.0) a2))))
double code(double a1, double a2, double th) {
return cos(th) * (a2 / (sqrt(2.0) / a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * (a2 / (sqrt(2.0d0) / a2))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * (a2 / (Math.sqrt(2.0) / a2));
}
def code(a1, a2, th): return math.cos(th) * (a2 / (math.sqrt(2.0) / a2))
function code(a1, a2, th) return Float64(cos(th) * Float64(a2 / Float64(sqrt(2.0) / a2))) end
function tmp = code(a1, a2, th) tmp = cos(th) * (a2 / (sqrt(2.0) / a2)); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(a2 / N[(N[Sqrt[2.0], $MachinePrecision] / a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{a2}{\frac{\sqrt{2}}{a2}}
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
cos-neg99.5%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
Taylor expanded in a2 around inf 60.1%
pow260.1%
associate-/l*60.0%
div-inv60.0%
*-commutative60.0%
associate-*r*60.0%
pow260.0%
add-sqr-sqrt60.0%
sqrt-unprod60.0%
frac-times60.0%
metadata-eval60.0%
rem-square-sqrt60.1%
metadata-eval60.1%
Applied egg-rr60.1%
metadata-eval60.1%
sqrt-pow152.0%
sqrt-prod52.1%
metadata-eval52.1%
div-inv52.1%
sqrt-div52.0%
sqrt-pow160.1%
metadata-eval60.1%
unpow260.1%
associate-*r/60.1%
clear-num60.1%
un-div-inv60.1%
Applied egg-rr60.1%
Final simplification60.1%
(FPCore (a1 a2 th) :precision binary64 (* a2 (/ a2 (sqrt 2.0))))
double code(double a1, double a2, double th) {
return a2 * (a2 / sqrt(2.0));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = a2 * (a2 / sqrt(2.0d0))
end function
public static double code(double a1, double a2, double th) {
return a2 * (a2 / Math.sqrt(2.0));
}
def code(a1, a2, th): return a2 * (a2 / math.sqrt(2.0))
function code(a1, a2, th) return Float64(a2 * Float64(a2 / sqrt(2.0))) end
function tmp = code(a1, a2, th) tmp = a2 * (a2 / sqrt(2.0)); end
code[a1_, a2_, th_] := N[(a2 * N[(a2 / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
a2 \cdot \frac{a2}{\sqrt{2}}
\end{array}
Initial program 99.6%
distribute-lft-out99.5%
Simplified99.5%
Taylor expanded in th around 0 64.8%
Taylor expanded in a1 around 0 39.4%
pow239.4%
associate-/l*39.5%
Applied egg-rr39.5%
Final simplification39.5%
herbie shell --seed 2024074
(FPCore (a1 a2 th)
:name "Migdal et al, Equation (64)"
:precision binary64
(+ (* (/ (cos th) (sqrt 2.0)) (* a1 a1)) (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))