Average Error: 0.5 → 0.4
Time: 10.5s
Precision: binary64
\[\frac{\cos th}{\sqrt{2}} \cdot \left(a1 \cdot a1\right) + \frac{\cos th}{\sqrt{2}} \cdot \left(a2 \cdot a2\right) \]
\[\cos th \cdot \left(\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt[3]{\sqrt{2}}} \cdot \sqrt[3]{0.5}\right) \]
\frac{\cos th}{\sqrt{2}} \cdot \left(a1 \cdot a1\right) + \frac{\cos th}{\sqrt{2}} \cdot \left(a2 \cdot a2\right)
\cos th \cdot \left(\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt[3]{\sqrt{2}}} \cdot \sqrt[3]{0.5}\right)
; Initial program: the sum of two products. Each product multiplies a squared
; input (a1*a1, then a2*a2) by the same factor cos(th) / sqrt(2), which is
; written out separately in both terms. All operations use binary64.
(FPCore (a1 a2 th)
 :precision binary64
 (+
  (* (/ (cos th) (sqrt 2.0)) (* a1 a1))
  (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))
; Rewritten program: a2*a2 + a1*a1 is formed with a single fma, divided by
; cbrt(sqrt(2)), multiplied by cbrt(0.5), and the result is scaled by cos(th).
; All operations use binary64.
(FPCore (a1 a2 th)
 :precision binary64
 (* (cos th) (* (/ (fma a2 a2 (* a1 a1)) (cbrt (sqrt 2.0))) (cbrt 0.5))))
double code(double a1, double a2, double th) {
	return ((cos(th) / sqrt(2.0)) * (a1 * a1)) + ((cos(th) / sqrt(2.0)) * (a2 * a2));
}
double code(double a1, double a2, double th) {
	return cos(th) * ((fma(a2, a2, (a1 * a1)) / cbrt(sqrt(2.0))) * cbrt(0.5));
}

Error

Bits error versus a1

Bits error versus a2

Bits error versus th

Derivation

  1. Initial program 0.5

    \[\frac{\cos th}{\sqrt{2}} \cdot \left(a1 \cdot a1\right) + \frac{\cos th}{\sqrt{2}} \cdot \left(a2 \cdot a2\right) \]
  2. Simplified 0.5

    \[\leadsto \color{blue}{\cos th \cdot \frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right)}{\sqrt{2}}} \]
  3. Applied add-cube-cbrt_binary64 0.5

    \[\leadsto \cos th \cdot \frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right)}{\color{blue}{\left(\sqrt[3]{\sqrt{2}} \cdot \sqrt[3]{\sqrt{2}}\right) \cdot \sqrt[3]{\sqrt{2}}}} \]
  4. Applied associate-/r*_binary64 0.5

    \[\leadsto \cos th \cdot \color{blue}{\frac{\frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right)}{\sqrt[3]{\sqrt{2}} \cdot \sqrt[3]{\sqrt{2}}}}{\sqrt[3]{\sqrt{2}}}} \]
  5. Applied associate-*r/_binary64 0.5

    \[\leadsto \color{blue}{\frac{\cos th \cdot \frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right)}{\sqrt[3]{\sqrt{2}} \cdot \sqrt[3]{\sqrt{2}}}}{\sqrt[3]{\sqrt{2}}}} \]
  6. Taylor expanded in th around inf 0.6

    \[\leadsto \frac{\color{blue}{\left(\left({a1}^{2} + {a2}^{2}\right) \cdot \cos th\right) \cdot {\left(\frac{1}{{\left(\sqrt{2}\right)}^{2}}\right)}^{0.3333333333333333}}}{\sqrt[3]{\sqrt{2}}} \]
  7. Simplified 0.4

    \[\leadsto \frac{\color{blue}{\cos th \cdot \left(\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}\right)}}{\sqrt[3]{\sqrt{2}}} \]
  8. Applied *-un-lft-identity_binary64 0.4

    \[\leadsto \frac{\cos th \cdot \left(\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}\right)}{\sqrt[3]{\sqrt{\color{blue}{1 \cdot 2}}}} \]
  9. Applied sqrt-prod_binary64 0.4

    \[\leadsto \frac{\cos th \cdot \left(\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}\right)}{\sqrt[3]{\color{blue}{\sqrt{1} \cdot \sqrt{2}}}} \]
  10. Applied cbrt-prod_binary64 0.4

    \[\leadsto \frac{\cos th \cdot \left(\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}\right)}{\color{blue}{\sqrt[3]{\sqrt{1}} \cdot \sqrt[3]{\sqrt{2}}}} \]
  11. Applied times-frac_binary64 0.4

    \[\leadsto \color{blue}{\frac{\cos th}{\sqrt[3]{\sqrt{1}}} \cdot \frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}}{\sqrt[3]{\sqrt{2}}}} \]
  12. Simplified 0.4

    \[\leadsto \color{blue}{\cos th} \cdot \frac{\mathsf{fma}\left(a1, a1, a2 \cdot a2\right) \cdot \sqrt[3]{0.5}}{\sqrt[3]{\sqrt{2}}} \]
  13. Simplified 0.4

    \[\leadsto \cos th \cdot \color{blue}{\left(\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt[3]{\sqrt{2}}} \cdot \sqrt[3]{0.5}\right)} \]
  14. Final simplification 0.4

    \[\leadsto \cos th \cdot \left(\frac{\mathsf{fma}\left(a2, a2, a1 \cdot a1\right)}{\sqrt[3]{\sqrt{2}}} \cdot \sqrt[3]{0.5}\right) \]

Reproduce

herbie shell --seed 2021332 
; Input expression for the reproduction: two squared inputs (a1*a1 and a2*a2),
; each multiplied by cos(th) / sqrt(2), then added. Evaluated in binary64.
(FPCore (a1 a2 th)
  :name "Migdal et al, Equation (64)"
  :precision binary64
  (+ (* (/ (cos th) (sqrt 2.0)) (* a1 a1)) (* (/ (cos th) (sqrt 2.0)) (* a2 a2))))