
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 11 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (a1 a2 th) :precision binary64 (let* ((t_1 (/ (cos th) (sqrt 2.0)))) (+ (* t_1 (* a1 a1)) (* t_1 (* a2 a2)))))
double code(double a1, double a2, double th) {
double t_1 = cos(th) / sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: t_1
t_1 = cos(th) / sqrt(2.0d0)
code = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
double t_1 = Math.cos(th) / Math.sqrt(2.0);
return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2));
}
def code(a1, a2, th): t_1 = math.cos(th) / math.sqrt(2.0) return (t_1 * (a1 * a1)) + (t_1 * (a2 * a2))
function code(a1, a2, th) t_1 = Float64(cos(th) / sqrt(2.0)) return Float64(Float64(t_1 * Float64(a1 * a1)) + Float64(t_1 * Float64(a2 * a2))) end
function tmp = code(a1, a2, th) t_1 = cos(th) / sqrt(2.0); tmp = (t_1 * (a1 * a1)) + (t_1 * (a2 * a2)); end
code[a1_, a2_, th_] := Block[{t$95$1 = N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]}, N[(N[(t$95$1 * N[(a1 * a1), $MachinePrecision]), $MachinePrecision] + N[(t$95$1 * N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
t_1 := \frac{\cos th}{\sqrt{2}}\\
t\_1 \cdot \left(a1 \cdot a1\right) + t\_1 \cdot \left(a2 \cdot a2\right)
\end{array}
\end{array}
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ (fma a2 a2 (* a1 a1)) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return cos(th) * (fma(a2, a2, (a1 * a1)) / sqrt(2.0));
}
function code(a1, a2, th) return Float64(cos(th) * Float64(fma(a2, a2, Float64(a1 * a1)) / sqrt(2.0))) end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 * a2 + N[(a1 * a1), $MachinePrecision]), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt{2}}
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
cos-neg99.6%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
(FPCore (a1 a2 th) :precision binary64 (if (<= (cos th) 0.7) (* (cos th) (* (+ a2 a1) (+ a2 a1))) (* (+ (* a1 a1) (* a2 a2)) (sqrt 0.5))))
double code(double a1, double a2, double th) {
double tmp;
if (cos(th) <= 0.7) {
tmp = cos(th) * ((a2 + a1) * (a2 + a1));
} else {
tmp = ((a1 * a1) + (a2 * a2)) * sqrt(0.5);
}
return tmp;
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
real(8) :: tmp
if (cos(th) <= 0.7d0) then
tmp = cos(th) * ((a2 + a1) * (a2 + a1))
else
tmp = ((a1 * a1) + (a2 * a2)) * sqrt(0.5d0)
end if
code = tmp
end function
public static double code(double a1, double a2, double th) {
double tmp;
if (Math.cos(th) <= 0.7) {
tmp = Math.cos(th) * ((a2 + a1) * (a2 + a1));
} else {
tmp = ((a1 * a1) + (a2 * a2)) * Math.sqrt(0.5);
}
return tmp;
}
def code(a1, a2, th): tmp = 0 if math.cos(th) <= 0.7: tmp = math.cos(th) * ((a2 + a1) * (a2 + a1)) else: tmp = ((a1 * a1) + (a2 * a2)) * math.sqrt(0.5) return tmp
function code(a1, a2, th) tmp = 0.0 if (cos(th) <= 0.7) tmp = Float64(cos(th) * Float64(Float64(a2 + a1) * Float64(a2 + a1))); else tmp = Float64(Float64(Float64(a1 * a1) + Float64(a2 * a2)) * sqrt(0.5)); end return tmp end
function tmp_2 = code(a1, a2, th) tmp = 0.0; if (cos(th) <= 0.7) tmp = cos(th) * ((a2 + a1) * (a2 + a1)); else tmp = ((a1 * a1) + (a2 * a2)) * sqrt(0.5); end tmp_2 = tmp; end
code[a1_, a2_, th_] := If[LessEqual[N[Cos[th], $MachinePrecision], 0.7], N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 + a1), $MachinePrecision] * N[(a2 + a1), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;\cos th \leq 0.7:\\
\;\;\;\;\cos th \cdot \left(\left(a2 + a1\right) \cdot \left(a2 + a1\right)\right)\\
\mathbf{else}:\\
\;\;\;\;\left(a1 \cdot a1 + a2 \cdot a2\right) \cdot \sqrt{0.5}\\
\end{array}
\end{array}
if (cos.f64 th) < 0.69999999999999996Initial program 99.7%
distribute-lft-out99.7%
cos-neg99.7%
associate-*l/99.6%
associate-/l*99.7%
cos-neg99.7%
+-commutative99.7%
fma-define99.7%
Simplified99.7%
div-inv99.6%
add-sqr-sqrt99.6%
associate-*l*99.5%
fma-undefine99.5%
hypot-define99.5%
fma-undefine99.5%
hypot-define99.5%
pow1/299.5%
pow-flip99.5%
metadata-eval99.5%
Applied egg-rr99.5%
Applied egg-rr59.1%
+-commutative59.1%
distribute-lft-out64.4%
+-commutative64.4%
Simplified64.4%
if 0.69999999999999996 < (cos.f64 th) Initial program 99.5%
distribute-lft-out99.5%
Simplified99.5%
clear-num99.5%
associate-/r/99.5%
pow1/299.5%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Taylor expanded in th around 0 92.1%
Final simplification82.0%
(FPCore (a1 a2 th) :precision binary64 (* (/ (cos th) (sqrt 2.0)) (+ (* a1 a1) (* a2 a2))))
double code(double a1, double a2, double th) {
return (cos(th) / sqrt(2.0)) * ((a1 * a1) + (a2 * a2));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = (cos(th) / sqrt(2.0d0)) * ((a1 * a1) + (a2 * a2))
end function
public static double code(double a1, double a2, double th) {
return (Math.cos(th) / Math.sqrt(2.0)) * ((a1 * a1) + (a2 * a2));
}
def code(a1, a2, th): return (math.cos(th) / math.sqrt(2.0)) * ((a1 * a1) + (a2 * a2))
function code(a1, a2, th) return Float64(Float64(cos(th) / sqrt(2.0)) * Float64(Float64(a1 * a1) + Float64(a2 * a2))) end
function tmp = code(a1, a2, th) tmp = (cos(th) / sqrt(2.0)) * ((a1 * a1) + (a2 * a2)); end
code[a1_, a2_, th_] := N[(N[(N[Cos[th], $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision] * N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\frac{\cos th}{\sqrt{2}} \cdot \left(a1 \cdot a1 + a2 \cdot a2\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
Simplified99.6%
(FPCore (a1 a2 th) :precision binary64 (* (+ (* a1 a1) (* a2 a2)) (* (cos th) (sqrt 0.5))))
double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * (cos(th) * sqrt(0.5));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = ((a1 * a1) + (a2 * a2)) * (cos(th) * sqrt(0.5d0))
end function
public static double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * (Math.cos(th) * Math.sqrt(0.5));
}
def code(a1, a2, th): return ((a1 * a1) + (a2 * a2)) * (math.cos(th) * math.sqrt(0.5))
function code(a1, a2, th) return Float64(Float64(Float64(a1 * a1) + Float64(a2 * a2)) * Float64(cos(th) * sqrt(0.5))) end
function tmp = code(a1, a2, th) tmp = ((a1 * a1) + (a2 * a2)) * (cos(th) * sqrt(0.5)); end
code[a1_, a2_, th_] := N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] * N[(N[Cos[th], $MachinePrecision] * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(a1 \cdot a1 + a2 \cdot a2\right) \cdot \left(\cos th \cdot \sqrt{0.5}\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
Simplified99.6%
clear-num99.6%
associate-/r/99.6%
pow1/299.6%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Taylor expanded in th around inf 99.6%
*-commutative99.6%
Simplified99.6%
Final simplification99.6%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (/ (* a2 a2) (sqrt 2.0))))
double code(double a1, double a2, double th) {
return cos(th) * ((a2 * a2) / sqrt(2.0));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * ((a2 * a2) / sqrt(2.0d0))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * ((a2 * a2) / Math.sqrt(2.0));
}
def code(a1, a2, th): return math.cos(th) * ((a2 * a2) / math.sqrt(2.0))
function code(a1, a2, th) return Float64(cos(th) * Float64(Float64(a2 * a2) / sqrt(2.0))) end
function tmp = code(a1, a2, th) tmp = cos(th) * ((a2 * a2) / sqrt(2.0)); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 * a2), $MachinePrecision] / N[Sqrt[2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \frac{a2 \cdot a2}{\sqrt{2}}
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
cos-neg99.6%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
Taylor expanded in a2 around inf 54.2%
pow254.2%
Applied egg-rr54.2%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (* a2 (* a2 (sqrt 0.5)))))
double code(double a1, double a2, double th) {
return cos(th) * (a2 * (a2 * sqrt(0.5)));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * (a2 * (a2 * sqrt(0.5d0)))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * (a2 * (a2 * Math.sqrt(0.5)));
}
def code(a1, a2, th): return math.cos(th) * (a2 * (a2 * math.sqrt(0.5)))
function code(a1, a2, th) return Float64(cos(th) * Float64(a2 * Float64(a2 * sqrt(0.5)))) end
function tmp = code(a1, a2, th) tmp = cos(th) * (a2 * (a2 * sqrt(0.5))); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(a2 * N[(a2 * N[Sqrt[0.5], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \left(a2 \cdot \left(a2 \cdot \sqrt{0.5}\right)\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
cos-neg99.6%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
div-inv99.6%
add-sqr-sqrt99.6%
associate-*l*99.5%
fma-undefine99.5%
hypot-define99.5%
fma-undefine99.5%
hypot-define99.5%
pow1/299.5%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Taylor expanded in a2 around inf 32.4%
*-commutative32.4%
Simplified32.4%
Taylor expanded in a2 around inf 54.3%
Final simplification54.3%
(FPCore (a1 a2 th) :precision binary64 (* (cos th) (* (+ a2 a1) (+ a2 a1))))
double code(double a1, double a2, double th) {
return cos(th) * ((a2 + a1) * (a2 + a1));
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = cos(th) * ((a2 + a1) * (a2 + a1))
end function
public static double code(double a1, double a2, double th) {
return Math.cos(th) * ((a2 + a1) * (a2 + a1));
}
def code(a1, a2, th): return math.cos(th) * ((a2 + a1) * (a2 + a1))
function code(a1, a2, th) return Float64(cos(th) * Float64(Float64(a2 + a1) * Float64(a2 + a1))) end
function tmp = code(a1, a2, th) tmp = cos(th) * ((a2 + a1) * (a2 + a1)); end
code[a1_, a2_, th_] := N[(N[Cos[th], $MachinePrecision] * N[(N[(a2 + a1), $MachinePrecision] * N[(a2 + a1), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\cos th \cdot \left(\left(a2 + a1\right) \cdot \left(a2 + a1\right)\right)
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
cos-neg99.6%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
div-inv99.6%
add-sqr-sqrt99.6%
associate-*l*99.5%
fma-undefine99.5%
hypot-define99.5%
fma-undefine99.5%
hypot-define99.5%
pow1/299.5%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Applied egg-rr55.7%
+-commutative55.7%
distribute-lft-out62.0%
+-commutative62.0%
Simplified62.0%
Final simplification62.0%
(FPCore (a1 a2 th) :precision binary64 (* (+ (* a1 a1) (* a2 a2)) 0.5))
double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * 0.5;
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = ((a1 * a1) + (a2 * a2)) * 0.5d0
end function
public static double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * 0.5;
}
def code(a1, a2, th): return ((a1 * a1) + (a2 * a2)) * 0.5
function code(a1, a2, th) return Float64(Float64(Float64(a1 * a1) + Float64(a2 * a2)) * 0.5) end
function tmp = code(a1, a2, th) tmp = ((a1 * a1) + (a2 * a2)) * 0.5; end
code[a1_, a2_, th_] := N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] * 0.5), $MachinePrecision]
\begin{array}{l}
\\
\left(a1 \cdot a1 + a2 \cdot a2\right) \cdot 0.5
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
Simplified99.6%
Taylor expanded in th around 0 67.1%
Applied egg-rr47.3%
Final simplification47.3%
(FPCore (a1 a2 th) :precision binary64 (* (+ (* a1 a1) (* a2 a2)) 0.25))
double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * 0.25;
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = ((a1 * a1) + (a2 * a2)) * 0.25d0
end function
public static double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * 0.25;
}
def code(a1, a2, th): return ((a1 * a1) + (a2 * a2)) * 0.25
function code(a1, a2, th) return Float64(Float64(Float64(a1 * a1) + Float64(a2 * a2)) * 0.25) end
function tmp = code(a1, a2, th) tmp = ((a1 * a1) + (a2 * a2)) * 0.25; end
code[a1_, a2_, th_] := N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] * 0.25), $MachinePrecision]
\begin{array}{l}
\\
\left(a1 \cdot a1 + a2 \cdot a2\right) \cdot 0.25
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
Simplified99.6%
Taylor expanded in th around 0 67.1%
Applied egg-rr46.5%
Final simplification46.5%
(FPCore (a1 a2 th) :precision binary64 (* (+ (* a1 a1) (* a2 a2)) -0.5))
double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * -0.5;
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = ((a1 * a1) + (a2 * a2)) * (-0.5d0)
end function
public static double code(double a1, double a2, double th) {
return ((a1 * a1) + (a2 * a2)) * -0.5;
}
def code(a1, a2, th): return ((a1 * a1) + (a2 * a2)) * -0.5
function code(a1, a2, th) return Float64(Float64(Float64(a1 * a1) + Float64(a2 * a2)) * -0.5) end
function tmp = code(a1, a2, th) tmp = ((a1 * a1) + (a2 * a2)) * -0.5; end
code[a1_, a2_, th_] := N[(N[(N[(a1 * a1), $MachinePrecision] + N[(a2 * a2), $MachinePrecision]), $MachinePrecision] * -0.5), $MachinePrecision]
\begin{array}{l}
\\
\left(a1 \cdot a1 + a2 \cdot a2\right) \cdot -0.5
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
Simplified99.6%
Taylor expanded in th around 0 67.1%
Applied egg-rr19.8%
Final simplification19.8%
(FPCore (a1 a2 th) :precision binary64 1.0)
double code(double a1, double a2, double th) {
return 1.0;
}
real(8) function code(a1, a2, th)
real(8), intent (in) :: a1
real(8), intent (in) :: a2
real(8), intent (in) :: th
code = 1.0d0
end function
public static double code(double a1, double a2, double th) {
return 1.0;
}
def code(a1, a2, th): return 1.0
function code(a1, a2, th) return 1.0 end
function tmp = code(a1, a2, th) tmp = 1.0; end
code[a1_, a2_, th_] := 1.0
\begin{array}{l}
\\
1
\end{array}
Initial program 99.6%
distribute-lft-out99.6%
cos-neg99.6%
associate-*l/99.6%
associate-/l*99.6%
cos-neg99.6%
+-commutative99.6%
fma-define99.6%
Simplified99.6%
div-inv99.6%
add-sqr-sqrt99.6%
associate-*l*99.5%
fma-undefine99.5%
hypot-define99.5%
fma-undefine99.5%
hypot-define99.5%
pow1/299.5%
pow-flip99.6%
metadata-eval99.6%
Applied egg-rr99.6%
Applied egg-rr3.4%
*-inverses3.4%
Simplified3.4%
herbie shell --seed 2024125
(FPCore (a1 a2 th)
:name "Migdal et al, Equation (64)"
:precision binary64
(+ (* (/ (cos th) (sqrt 2.0)) (* a1 a1)) (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))