
; Binary64 evaluation of (cos(th)/sqrt(2))*(a1*a1) + (cos(th)/sqrt(2))*(a2*a2); the shared factor is bound once as t_1.
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
!> Evaluate (cos(th)/sqrt(2)) * a1**2 + (cos(th)/sqrt(2)) * a2**2 in
!> 64-bit real arithmetic.
!>
!> a1, a2 : values that are squared and then scaled
!> th     : argument of the cosine
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res
  real(dp) :: factor

  ! Factor shared by both terms; computed once.
  factor = cos(th) / sqrt(2.0_dp)
  res = (factor * (a1 * a1)) + (factor * (a2 * a2))
end function code
/**
 * Evaluates {@code (cos(th) / sqrt(2)) * a1*a1 + (cos(th) / sqrt(2)) * a2*a2}.
 *
 * @param a1 first value; squared before scaling
 * @param a2 second value; squared before scaling
 * @param th argument passed to {@link Math#cos(double)}
 * @return the sum of the two scaled squares
 */
public static double code(double a1, double a2, double th) {
    final double scale = Math.cos(th) / Math.sqrt(2.0);
    final double a1Term = scale * (a1 * a1);
    final double a2Term = scale * (a2 * a2);
    return a1Term + a2Term;
}
def code(a1, a2, th):
    """Return (cos(th) / sqrt(2)) * a1**2 + (cos(th) / sqrt(2)) * a2**2.

    The shared factor cos(th) / sqrt(2) is computed once and multiplied
    into each squared input separately before the two products are added.
    """
    # The original had both statements fused onto the `def` line, which
    # does not parse; they are split onto their own lines here.
    t_1 = math.cos(th) / math.sqrt(2.0)
    return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
# Evaluate (cos(th)/sqrt(2)) * a1^2 + (cos(th)/sqrt(2)) * a2^2.
# Every intermediate is passed through Float64(...), as in the generated
# expression.  The original fused both statements onto one line with no
# separator; they are placed on separate lines here.
function code(a1, a2, th)
    t_1 = Float64(cos(th) / sqrt(2.0))
    return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2)))
end
function result = code(a1, a2, th)
    % CODE  Evaluate (cos(th)/sqrt(2))*(a1*a1) + (cos(th)/sqrt(2))*(a2*a2).
    %   The shared factor cos(th)/sqrt(2) is computed once and applied to
    %   each squared input separately.
    scale = cos(th) / sqrt(2.0);
    result = (scale * (a1 * a1)) + (scale * (a2 * a2));
end
(* Evaluates (Cos[th]/Sqrt[2]) * a1^2 + (Cos[th]/Sqrt[2]) * a2^2; each intermediate is wrapped in N[..., $MachinePrecision], and the shared factor is bound once as t$95$1. *)
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t_1 \cdot \left(a1 \cdot a1\right) + t_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Binary64 evaluation of (cos(th)/sqrt(2))*(a1*a1) + (cos(th)/sqrt(2))*(a2*a2), with the shared factor bound once as t_1.
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
!> Return a1**2 and a2**2, each multiplied by cos(th)/sqrt(2), summed,
!> using 64-bit real arithmetic.
!>
!> a1, a2 : values that are squared and then scaled
!> th     : argument of the cosine
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res
  real(dp) :: factor

  ! Evaluate the common factor once and reuse it for both terms.
  factor = cos(th) / sqrt(2.0_dp)
  res = (factor * (a1 * a1)) + (factor * (a2 * a2))
end function code
/**
 * Returns {@code a1*a1} and {@code a2*a2}, each multiplied by
 * {@code cos(th) / sqrt(2)}, added together.
 *
 * @param a1 first value; squared before scaling
 * @param a2 second value; squared before scaling
 * @param th argument passed to {@link Math#cos(double)}
 * @return the sum of the two scaled squares
 */
public static double code(double a1, double a2, double th) {
    final double factor = Math.cos(th) / Math.sqrt(2.0);
    final double scaledA1Sq = factor * (a1 * a1);
    final double scaledA2Sq = factor * (a2 * a2);
    return scaledA1Sq + scaledA2Sq;
}
def code(a1, a2, th):
    """Return a1**2 and a2**2, each scaled by cos(th) / sqrt(2), summed.

    The scale factor is evaluated once and reused for both terms.
    """
    # Split out of the original single line, where the assignment and the
    # return were fused after the `def` header and could not be parsed.
    t_1 = math.cos(th) / math.sqrt(2.0)
    return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
# Return a1^2 and a2^2, each scaled by cos(th)/sqrt(2), summed.
# Float64(...) is applied to every intermediate, matching the generated
# expression.  The two statements were fused on one line in the original
# and are separated here.
function code(a1, a2, th)
    t_1 = Float64(cos(th) / sqrt(2.0))
    return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2)))
end
function result = code(a1, a2, th)
    % CODE  Sum of a1*a1 and a2*a2, each multiplied by cos(th)/sqrt(2).
    %   The factor is evaluated once and reused for both terms.
    factor = cos(th) / sqrt(2.0);
    result = (factor * (a1 * a1)) + (factor * (a2 * a2));
end
(* Sum of a1^2 and a2^2, each multiplied by Cos[th]/Sqrt[2]; the factor is bound once as t$95$1 and every intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t_1 \cdot \left(a1 \cdot a1\right) + t_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
; Alternative form: cos(th) * (hypot(a1, a2) * (hypot(a1, a2) * 2^-0.5)); a1^2 + a2^2 is expressed as hypot(a1, a2) multiplied by itself.
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (* (hypot a1 a2) (* (hypot a1 a2) (pow 2.0 -0.5)))))
double code(double a1, double a2, double th) {
return cos(th) * (hypot(a1, a2) * (hypot(a1, a2) * pow(2.0, -0.5)));
}
/**
 * Evaluates {@code cos(th) * (hypot(a1, a2) * (hypot(a1, a2) * 2^-0.5))}.
 * {@code Math.hypot(a1, a2)} is evaluated once and reused; the
 * multiplication order of the original expression is kept.
 *
 * @param a1 first argument to {@link Math#hypot(double, double)}
 * @param a2 second argument to {@link Math#hypot(double, double)}
 * @param th argument passed to {@link Math#cos(double)}
 * @return the product described above
 */
public static double code(double a1, double a2, double th) {
    final double radius = Math.hypot(a1, a2);
    final double invSqrt2 = Math.pow(2.0, -0.5);
    return Math.cos(th) * (radius * (radius * invSqrt2));
}
def code(a1, a2, th):
    """Return cos(th) * (hypot(a1, a2) * (hypot(a1, a2) * 2**-0.5)).

    math.hypot(a1, a2) is evaluated once and reused; the multiplication
    order of the original expression is kept.
    """
    radius = math.hypot(a1, a2)
    inv_sqrt2 = math.pow(2.0, -0.5)
    return math.cos(th) * (radius * (radius * inv_sqrt2))
# Evaluate cos(th) * (hypot(a1, a2) * (hypot(a1, a2) * 2^-0.5)).
# hypot(a1, a2) is evaluated once and reused; each product is still passed
# through Float64(...) in the same nesting as the generated expression.
function code(a1, a2, th)
    radius = hypot(a1, a2)
    inner = Float64(radius * (2.0 ^ -0.5))
    outer = Float64(radius * inner)
    return Float64(cos(th) * outer)
end
function result = code(a1, a2, th)
    % CODE  Evaluate cos(th) * (hypot(a1,a2) * (hypot(a1,a2) * 2^-0.5)).
    %   hypot(a1, a2) is evaluated once and reused; the multiplication
    %   order of the original expression is kept.
    radius = hypot(a1, a2);
    result = cos(th) * (radius * (radius * (2.0 ^ -0.5)));
end
(* Evaluates Cos[th] * (h * (h * 2^-0.5)) where h is written inline as Sqrt[a1^2 + a2^2]; each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[Sqrt[a1 ^ 2 + a2 ^ 2], $MachinePrecision] * N[(N[Sqrt[a1 ^ 2 + a2 ^ 2], $MachinePrecision] * N[Power[2.0, -0.5], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \left(\mathsf{hypot}\left(a1, a2\right) \cdot \left(\mathsf{hypot}\left(a1, a2\right) \cdot {2}^{-0.5}\right)\right)
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
associate-*l/ 99.5%
associate-*r/ 99.6%
fma-def 99.6%
Simplified 99.6%
fma-def 99.6%
div-inv 99.5%
add-sqr-sqrt 99.5%
associate-*l* 99.5%
hypot-def 99.5%
hypot-def 99.5%
pow1/2 99.5%
pow-flip 99.7%
metadata-eval 99.7%
Applied egg-rr 99.7%
Final simplification 99.7%
; Alternative form: cos(th) * ((a1*a1 + a2*a2) / sqrt(2)); the squares are summed first, then divided by sqrt(2).
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ (+ (* a1 a1) (* a2 a2)) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return cos(th) * (((a1 * a1) + (a2 * a2)) / sqrt(2.0));
}
!> Evaluate cos(th) * ((a1**2 + a2**2) / sqrt(2)) in 64-bit real
!> arithmetic: the squares are summed, divided by sqrt(2), then multiplied
!> by cos(th).
!>
!> a1, a2 : values whose squares are summed
!> th     : argument of the cosine
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res

  res = cos(th) * (((a1 * a1) + (a2 * a2)) / sqrt(2.0_dp))
end function code
/**
 * Evaluates {@code cos(th) * ((a1*a1 + a2*a2) / sqrt(2))}.
 *
 * @param a1 first value; its square is added to that of {@code a2}
 * @param a2 second value
 * @param th argument passed to {@link Math#cos(double)}
 * @return the cosine multiplied by the scaled sum of squares
 */
public static double code(double a1, double a2, double th) {
    final double sumSq = (a1 * a1) + (a2 * a2);
    final double scaled = sumSq / Math.sqrt(2.0);
    return Math.cos(th) * scaled;
}
def code(a1, a2, th):
    """Return cos(th) * ((a1**2 + a2**2) / sqrt(2)).

    The squares are summed first, the sum is divided by sqrt(2), and the
    quotient is multiplied by cos(th).
    """
    sum_sq = (a1 * a1) + (a2 * a2)
    scaled = sum_sq / math.sqrt(2.0)
    return math.cos(th) * scaled
# Evaluate cos(th) * ((a1^2 + a2^2) / sqrt(2)).
# Each intermediate is passed through Float64(...) in the same nesting as
# the generated expression.
function code(a1, a2, th)
    sum_sq = Float64(Float64(a1 * a1) + Float64(a2 * a2))
    scaled = Float64(sum_sq / sqrt(2.0))
    return Float64(cos(th) * scaled)
end
function result = code(a1, a2, th)
    % CODE  Evaluate cos(th) * ((a1*a1 + a2*a2) / sqrt(2)).
    sum_sq = (a1 * a1) + (a2 * a2);
    result = cos(th) * (sum_sq / sqrt(2.0));
end
(* Evaluates Cos[th] * ((a1*a1 + a2*a2) / Sqrt[2]); each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{a1 \cdot a1 + a2 \cdot a2}{\sqrt{2}}
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
associate-*l/ 99.5%
associate-*r/ 99.6%
fma-def 99.6%
Simplified 99.6%
fma-def 99.6%
+-commutative 99.6%
Applied egg-rr 99.6%
Final simplification 99.6%
; Alternative form: (cos(th) * sqrt(0.5)) * (a1*a1 + a2*a2); the division by sqrt(2) is replaced by a multiplication by sqrt(0.5).
(FPCore (a1 a2 th) :precision binary64 (* (* (cos th) (sqrt 0.5)) (+ (* a1 a1) (* a2 a2))))
double code(double a1, double a2, double th) {
return (cos(th) * sqrt(0.5)) * ((a1 * a1) + (a2 * a2));
}
!> Evaluate (cos(th) * sqrt(0.5)) * (a1**2 + a2**2) in 64-bit real
!> arithmetic.
!>
!> a1, a2 : values whose squares are summed
!> th     : argument of the cosine
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res

  res = (cos(th) * sqrt(0.5_dp)) * ((a1 * a1) + (a2 * a2))
end function code
/**
 * Evaluates {@code (cos(th) * sqrt(0.5)) * (a1*a1 + a2*a2)}.
 *
 * @param a1 first value; its square is added to that of {@code a2}
 * @param a2 second value
 * @param th argument passed to {@link Math#cos(double)}
 * @return the scaled cosine multiplied by the sum of squares
 */
public static double code(double a1, double a2, double th) {
    final double scale = Math.cos(th) * Math.sqrt(0.5);
    final double sumSq = (a1 * a1) + (a2 * a2);
    return scale * sumSq;
}
def code(a1, a2, th):
    """Return (cos(th) * sqrt(0.5)) * (a1**2 + a2**2)."""
    scale = math.cos(th) * math.sqrt(0.5)
    sum_sq = (a1 * a1) + (a2 * a2)
    return scale * sum_sq
# Evaluate (cos(th) * sqrt(0.5)) * (a1^2 + a2^2).
# Each intermediate is passed through Float64(...) in the same nesting as
# the generated expression.
function code(a1, a2, th)
    scale = Float64(cos(th) * sqrt(0.5))
    sum_sq = Float64(Float64(a1 * a1) + Float64(a2 * a2))
    return Float64(scale * sum_sq)
end
function result = code(a1, a2, th)
    % CODE  Evaluate (cos(th) * sqrt(0.5)) * (a1*a1 + a2*a2).
    scale = cos(th) * sqrt(0.5);
    result = scale * ((a1 * a1) + (a2 * a2));
end
(* Evaluates (Cos[th] * Sqrt[0.5]) * (a1*a1 + a2*a2); each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(N[(N[Cos[th], $MachinePrecision] * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision] * N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(\cos th \cdot \sqrt{0.5}\right) \cdot \left(a1 \cdot a1 + a2 \cdot a2\right)
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
Simplified 99.5%
clear-num 99.5%
associate-/r/ 99.5%
pow1/2 99.5%
pow-flip 99.7%
metadata-eval 99.7%
Applied egg-rr 99.7%
Taylor expanded in th around inf 99.7%
Final simplification 99.7%
; Approximate alternative: a2 * (sqrt(0.5) * (cos(th) * a2)). a1 is accepted but not used; the report's derivation for this form Taylor-expands in a1 around 0.
(FPCore (a1 a2 th) :precision binary64 (* a2 (* (sqrt 0.5) (* (cos th) a2))))
double code(double a1, double a2, double th) {
return a2 * (sqrt(0.5) * (cos(th) * a2));
}
!> Evaluate a2 * (sqrt(0.5) * (cos(th) * a2)) in 64-bit real arithmetic.
!>
!> a1 : accepted for interface compatibility but not used; the report's
!>      derivation for this form Taylor-expands in a1 around 0
!> a2 : value multiplied in twice
!> th : argument of the cosine
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res

  res = a2 * (sqrt(0.5_dp) * (cos(th) * a2))
end function code
/**
 * Evaluates {@code a2 * (sqrt(0.5) * (cos(th) * a2))}.
 *
 * @param a1 accepted but not used; the report's derivation for this form
 *           Taylor-expands in a1 around 0
 * @param a2 value multiplied in twice
 * @param th argument passed to {@link Math#cos(double)}
 * @return the product described above
 */
public static double code(double a1, double a2, double th) {
    final double cosA2 = Math.cos(th) * a2;
    final double scaled = Math.sqrt(0.5) * cosA2;
    return a2 * scaled;
}
def code(a1, a2, th):
    """Return a2 * (sqrt(0.5) * (cos(th) * a2)).

    a1 is accepted but not used; the report's derivation for this form
    Taylor-expands in a1 around 0.
    """
    cos_a2 = math.cos(th) * a2
    scaled = math.sqrt(0.5) * cos_a2
    return a2 * scaled
# Evaluate a2 * (sqrt(0.5) * (cos(th) * a2)).
# a1 is accepted but not used.  Each product is passed through Float64(...)
# in the same nesting as the generated expression.
function code(a1, a2, th)
    cos_a2 = Float64(cos(th) * a2)
    scaled = Float64(sqrt(0.5) * cos_a2)
    return Float64(a2 * scaled)
end
function result = code(a1, a2, th)
    % CODE  Evaluate a2 * (sqrt(0.5) * (cos(th) * a2)).
    %   a1 is accepted but not used.
    cos_a2 = cos(th) * a2;
    result = a2 * (sqrt(0.5) * cos_a2);
end
(* Evaluates a2 * (Sqrt[0.5] * (Cos[th] * a2)); a1 is matched by the pattern but not used. Each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(a2 * N[(N[Sqrt[0.5], $MachinePrecision] * N[(N[Cos[th], $MachinePrecision] * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
a2 \cdot \left(\sqrt{0.5} \cdot \left(\cos th \cdot a2\right)\right)
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
associate-*l/ 99.5%
associate-*r/ 99.6%
fma-def 99.6%
Simplified 99.6%
Taylor expanded in a1 around 0 56.0%
unpow2 56.0%
associate-*l* 56.0%
Simplified 56.0%
div-inv 56.0%
associate-*l* 56.0%
add-sqr-sqrt 56.0%
sqrt-unprod 56.0%
frac-times 56.0%
metadata-eval 56.0%
add-sqr-sqrt 56.1%
metadata-eval 56.1%
Applied egg-rr 56.1%
Final simplification 56.1%
; Approximate alternative: sqrt(0.5) * (a1*a1 + a2*a2). th is accepted but not used; the report's derivation for this form Taylor-expands in th around 0.
(FPCore (a1 a2 th) :precision binary64 (* (sqrt 0.5) (+ (* a1 a1) (* a2 a2))))
/*
 * Evaluates sqrt(0.5) * (a1^2 + a2^2).
 * th is part of the signature but does not contribute to the result; the
 * report's derivation for this form Taylor-expands in th around 0.
 */
double code(double a1, double a2, double th) {
    (void)th; /* intentionally unused */
    const double sum_sq = (a1 * a1) + (a2 * a2);
    return sqrt(0.5) * sum_sq;
}
!> Evaluate sqrt(0.5) * (a1**2 + a2**2) in 64-bit real arithmetic.
!>
!> a1, a2 : values whose squares are summed
!> th     : accepted for interface compatibility but not used; the
!>          report's derivation for this form Taylor-expands in th around 0
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res

  res = sqrt(0.5_dp) * ((a1 * a1) + (a2 * a2))
end function code
/**
 * Evaluates {@code sqrt(0.5) * (a1*a1 + a2*a2)}.
 *
 * @param a1 first value; its square is added to that of {@code a2}
 * @param a2 second value
 * @param th accepted but not used; the report's derivation for this form
 *           Taylor-expands in th around 0
 * @return the scaled sum of squares
 */
public static double code(double a1, double a2, double th) {
    final double sumSq = (a1 * a1) + (a2 * a2);
    return Math.sqrt(0.5) * sumSq;
}
def code(a1, a2, th):
    """Return sqrt(0.5) * (a1**2 + a2**2).

    th is accepted but not used; the report's derivation for this form
    Taylor-expands in th around 0.
    """
    sum_sq = (a1 * a1) + (a2 * a2)
    return math.sqrt(0.5) * sum_sq
# Evaluate sqrt(0.5) * (a1^2 + a2^2).
# th is accepted but not used.  Each intermediate is passed through
# Float64(...) in the same nesting as the generated expression.
function code(a1, a2, th)
    sum_sq = Float64(Float64(a1 * a1) + Float64(a2 * a2))
    return Float64(sqrt(0.5) * sum_sq)
end
function result = code(a1, a2, th)
    % CODE  Evaluate sqrt(0.5) * (a1*a1 + a2*a2).
    %   th is accepted but not used.
    sum_sq = (a1 * a1) + (a2 * a2);
    result = sqrt(0.5) * sum_sq;
end
(* Evaluates Sqrt[0.5] * (a1*a1 + a2*a2); th is matched by the pattern but not used. Each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(N[Sqrt[0.5], $MachinePrecision] * N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\sqrt{0.5} \cdot \left(a1 \cdot a1 + a2 \cdot a2\right)
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
Simplified 99.5%
clear-num 99.5%
associate-/r/ 99.5%
pow1/2 99.5%
pow-flip 99.7%
metadata-eval 99.7%
Applied egg-rr 99.7%
Taylor expanded in th around 0 70.0%
Final simplification 70.0%
; Approximate alternative: a2 * (a2 * sqrt(0.5)). Neither a1 nor th is used; the report's derivation for this form Taylor-expands in a1 around 0 and in th around 0.
(FPCore (a1 a2 th) :precision binary64 (* a2 (* a2 (sqrt 0.5))))
/*
 * Evaluates a2 * (a2 * sqrt(0.5)).
 * a1 and th are part of the signature but do not contribute to the result;
 * the report's derivation for this form Taylor-expands in a1 around 0 and
 * in th around 0.
 */
double code(double a1, double a2, double th) {
    (void)a1; /* intentionally unused */
    (void)th; /* intentionally unused */
    const double scaled = a2 * sqrt(0.5);
    return a2 * scaled;
}
!> Evaluate a2 * (a2 * sqrt(0.5)) in 64-bit real arithmetic.
!>
!> a1 : accepted for interface compatibility but not used
!> a2 : value multiplied in twice
!> th : accepted for interface compatibility but not used
!>
!> The report's derivation for this form Taylor-expands in a1 around 0 and
!> in th around 0, which is why only a2 appears in the expression.
pure function code(a1, a2, th) result(res)
  use, intrinsic :: iso_fortran_env, only: dp => real64
  implicit none
  real(dp), intent(in) :: a1
  real(dp), intent(in) :: a2
  real(dp), intent(in) :: th
  real(dp) :: res

  res = a2 * (a2 * sqrt(0.5_dp))
end function code
/**
 * Evaluates {@code a2 * (a2 * sqrt(0.5))}.
 *
 * @param a1 accepted but not used
 * @param a2 value multiplied in twice
 * @param th accepted but not used
 * @return {@code a2 * (a2 * sqrt(0.5))}
 */
public static double code(double a1, double a2, double th) {
    final double scaled = a2 * Math.sqrt(0.5);
    return a2 * scaled;
}
def code(a1, a2, th):
    """Return a2 * (a2 * sqrt(0.5)).

    a1 and th are accepted but not used; the report's derivation for this
    form Taylor-expands in a1 around 0 and in th around 0.
    """
    scaled = a2 * math.sqrt(0.5)
    return a2 * scaled
# Evaluate a2 * (a2 * sqrt(0.5)).
# a1 and th are accepted but not used.  Each product is passed through
# Float64(...) in the same nesting as the generated expression.
function code(a1, a2, th)
    scaled = Float64(a2 * sqrt(0.5))
    return Float64(a2 * scaled)
end
function result = code(a1, a2, th)
    % CODE  Evaluate a2 * (a2 * sqrt(0.5)).
    %   a1 and th are accepted but not used.
    scaled = a2 * sqrt(0.5);
    result = a2 * scaled;
end
(* Evaluates a2 * (a2 * Sqrt[0.5]); a1 and th are matched by the pattern but not used. Each intermediate is wrapped in N[..., $MachinePrecision]. *)
code[a1_, a2_, th_] := N[(a2 * N[(a2 * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
a2 \cdot \left(a2 \cdot \sqrt{0.5}\right)
\end{array}
Initial program 99.5%
distribute-lft-out 99.5%
associate-*l/ 99.5%
associate-*r/ 99.6%
fma-def 99.6%
Simplified 99.6%
Taylor expanded in a1 around 0 56.0%
unpow2 56.0%
associate-*l* 56.0%
Simplified 56.0%
div-inv 56.0%
associate-*l* 56.0%
add-sqr-sqrt 56.0%
sqrt-unprod 56.0%
frac-times 56.0%
metadata-eval 56.0%
add-sqr-sqrt 56.1%
metadata-eval 56.1%
Applied egg-rr 56.1%
Taylor expanded in th around 0 39.1%
Final simplification 39.1%
herbie shell --seed 2023242
; Benchmark input: (cos(th)/sqrt(2)) * (a1*a1) + (cos(th)/sqrt(2)) * (a2*a2),
; evaluated in binary64. The factor cos(th)/sqrt(2) is written out in both terms.
(FPCore (a1 a2 th)
:name "Migdal et al, Equation (64)"
:precision binary64
(+ (* (/ (cos th) (sqrt 2.0)) (* a1 a1)) (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))