Toniolo and Linder, Equation (3a)

Percentage Accurate: 98.4% → 98.3%
Time: 16.0s
Alternatives: 9
Speedup: 1.0×

Specification

?
\[\begin{array}{l} \\ \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \end{array} \]
(FPCore (l Om kx ky)
 :precision binary64
 (sqrt
  (*
   (/ 1.0 2.0)
   (+
    1.0
    (/
     1.0
     (sqrt
      (+
       1.0
       (*
        (pow (/ (* 2.0 l) Om) 2.0)
        (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))
double code(double l, double Om, double kx, double ky) {
	return sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + (pow(((2.0 * l) / Om), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0)))))))));
}
real(8) function code(l, om, kx, ky)
    real(8), intent (in) :: l
    real(8), intent (in) :: om
    real(8), intent (in) :: kx
    real(8), intent (in) :: ky
    code = sqrt(((1.0d0 / 2.0d0) * (1.0d0 + (1.0d0 / sqrt((1.0d0 + ((((2.0d0 * l) / om) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0)))))))))
end function
public static double code(double l, double Om, double kx, double ky) {
	return Math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / Math.sqrt((1.0 + (Math.pow(((2.0 * l) / Om), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0)))))))));
}
def code(l, Om, kx, ky):
	return math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / math.sqrt((1.0 + (math.pow(((2.0 * l) / Om), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0)))))))))
function code(l, Om, kx, ky)
	return sqrt(Float64(Float64(1.0 / 2.0) * Float64(1.0 + Float64(1.0 / sqrt(Float64(1.0 + Float64((Float64(Float64(2.0 * l) / Om) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))))
end
function tmp = code(l, Om, kx, ky)
	tmp = sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + ((((2.0 * l) / Om) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))));
end
code[l_, Om_, kx_, ky_] := N[Sqrt[N[(N[(1.0 / 2.0), $MachinePrecision] * N[(1.0 + N[(1.0 / N[Sqrt[N[(1.0 + N[(N[Power[N[(N[(2.0 * l), $MachinePrecision] / Om), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}

\\
\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)}
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 9 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 98.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \end{array} \]
(FPCore (l Om kx ky)
 :precision binary64
 (sqrt
  (*
   (/ 1.0 2.0)
   (+
    1.0
    (/
     1.0
     (sqrt
      (+
       1.0
       (*
        (pow (/ (* 2.0 l) Om) 2.0)
        (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))
double code(double l, double Om, double kx, double ky) {
	return sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + (pow(((2.0 * l) / Om), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0)))))))));
}
real(8) function code(l, om, kx, ky)
    real(8), intent (in) :: l
    real(8), intent (in) :: om
    real(8), intent (in) :: kx
    real(8), intent (in) :: ky
    code = sqrt(((1.0d0 / 2.0d0) * (1.0d0 + (1.0d0 / sqrt((1.0d0 + ((((2.0d0 * l) / om) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0)))))))))
end function
public static double code(double l, double Om, double kx, double ky) {
	return Math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / Math.sqrt((1.0 + (Math.pow(((2.0 * l) / Om), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0)))))))));
}
def code(l, Om, kx, ky):
	return math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / math.sqrt((1.0 + (math.pow(((2.0 * l) / Om), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0)))))))))
function code(l, Om, kx, ky)
	return sqrt(Float64(Float64(1.0 / 2.0) * Float64(1.0 + Float64(1.0 / sqrt(Float64(1.0 + Float64((Float64(Float64(2.0 * l) / Om) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))))
end
function tmp = code(l, Om, kx, ky)
	tmp = sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + ((((2.0 * l) / Om) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))));
end
code[l_, Om_, kx_, ky_] := N[Sqrt[N[(N[(1.0 / 2.0), $MachinePrecision] * N[(1.0 + N[(1.0 / N[Sqrt[N[(1.0 + N[(N[Power[N[(N[(2.0 * l), $MachinePrecision] / Om), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}

\\
\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)}
\end{array}

Alternative 1: 98.3% accurate, 1.8× speedup?

\[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\ \;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{l\_m}{Om\_m} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)}\\ \mathbf{else}:\\ \;\;\;\;\sqrt{0.5}\\ \end{array} \end{array} \]
l_m = (fabs.f64 l)
Om_m = (fabs.f64 Om)
(FPCore (l_m Om_m kx ky)
 :precision binary64
 (if (<= (/ (* 2.0 l_m) Om_m) 2.5e+96)
   (sqrt
    (*
     0.5
     (+
      1.0
      (/
       1.0
       (sqrt
        (fma
         (* (/ l_m Om_m) 4.0)
         (*
          (/ l_m Om_m)
          (+
           (+ 0.5 (* -0.5 (cos (+ kx kx))))
           (+ 0.5 (* -0.5 (cos (+ ky ky))))))
         1.0))))))
   (sqrt 0.5)))
l_m = fabs(l);
Om_m = fabs(Om);
double code(double l_m, double Om_m, double kx, double ky) {
	double tmp;
	if (((2.0 * l_m) / Om_m) <= 2.5e+96) {
		tmp = sqrt((0.5 * (1.0 + (1.0 / sqrt(fma(((l_m / Om_m) * 4.0), ((l_m / Om_m) * ((0.5 + (-0.5 * cos((kx + kx)))) + (0.5 + (-0.5 * cos((ky + ky)))))), 1.0))))));
	} else {
		tmp = sqrt(0.5);
	}
	return tmp;
}
l_m = abs(l)
Om_m = abs(Om)
function code(l_m, Om_m, kx, ky)
	tmp = 0.0
	if (Float64(Float64(2.0 * l_m) / Om_m) <= 2.5e+96)
		tmp = sqrt(Float64(0.5 * Float64(1.0 + Float64(1.0 / sqrt(fma(Float64(Float64(l_m / Om_m) * 4.0), Float64(Float64(l_m / Om_m) * Float64(Float64(0.5 + Float64(-0.5 * cos(Float64(kx + kx)))) + Float64(0.5 + Float64(-0.5 * cos(Float64(ky + ky)))))), 1.0))))));
	else
		tmp = sqrt(0.5);
	end
	return tmp
end
l_m = N[Abs[l], $MachinePrecision]
Om_m = N[Abs[Om], $MachinePrecision]
code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.5e+96], N[Sqrt[N[(0.5 * N[(1.0 + N[(1.0 / N[Sqrt[N[(N[(N[(l$95$m / Om$95$m), $MachinePrecision] * 4.0), $MachinePrecision] * N[(N[(l$95$m / Om$95$m), $MachinePrecision] * N[(N[(0.5 + N[(-0.5 * N[Cos[N[(kx + kx), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + N[(0.5 + N[(-0.5 * N[Cos[N[(ky + ky), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], N[Sqrt[0.5], $MachinePrecision]]
\begin{array}{l}
l_m = \left|\ell\right|
\\
Om_m = \left|Om\right|

\\
\begin{array}{l}
\mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\
\;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{l\_m}{Om\_m} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)}\\

\mathbf{else}:\\
\;\;\;\;\sqrt{0.5}\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (/.f64 (*.f64 #s(literal 2 binary64) l) Om) < 2.5000000000000002e96

    1. Initial program 100.0%

      \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
    2. Add Preprocessing
    3. Applied egg-rr96.4%

      \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\color{blue}{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}}\right)} \]
    4. Step-by-step derivation
      1. metadata-eval96.4

        \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]
    5. Applied egg-rr96.4%

      \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]

    if 2.5000000000000002e96 < (/.f64 (*.f64 #s(literal 2 binary64) l) Om)

    1. Initial program 91.8%

      \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
    2. Add Preprocessing
    3. Taylor expanded in l around inf

      \[\leadsto \sqrt{\color{blue}{\frac{1}{2}}} \]
    4. Step-by-step derivation
      1. Simplified98.4%

        \[\leadsto \sqrt{\color{blue}{0.5}} \]
    5. Recombined 2 regimes into one program.
    6. Add Preprocessing

    Alternative 2: 91.7% accurate, 0.9× speedup?

    \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\ \;\;\;\;\mathsf{fma}\left(-0.5, \frac{l\_m}{Om\_m} \cdot \frac{l\_m \cdot \mathsf{fma}\left(-0.5, \cos \left(kx \cdot -2\right), 0.5\right)}{Om\_m}, 1\right)\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(-0.25, \frac{Om\_m}{l\_m \cdot \sin ky}, 0.5\right)}\\ \end{array} \end{array} \]
    l_m = (fabs.f64 l)
    Om_m = (fabs.f64 Om)
    (FPCore (l_m Om_m kx ky)
     :precision binary64
     (if (<=
          (*
           (pow (/ (* 2.0 l_m) Om_m) 2.0)
           (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0)))
          0.5)
       (fma
        -0.5
        (* (/ l_m Om_m) (/ (* l_m (fma -0.5 (cos (* kx -2.0)) 0.5)) Om_m))
        1.0)
       (sqrt (fma -0.25 (/ Om_m (* l_m (sin ky))) 0.5))))
    l_m = fabs(l);
    Om_m = fabs(Om);
    double code(double l_m, double Om_m, double kx, double ky) {
    	double tmp;
    	if ((pow(((2.0 * l_m) / Om_m), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0))) <= 0.5) {
    		tmp = fma(-0.5, ((l_m / Om_m) * ((l_m * fma(-0.5, cos((kx * -2.0)), 0.5)) / Om_m)), 1.0);
    	} else {
    		tmp = sqrt(fma(-0.25, (Om_m / (l_m * sin(ky))), 0.5));
    	}
    	return tmp;
    }
    
    l_m = abs(l)
    Om_m = abs(Om)
    function code(l_m, Om_m, kx, ky)
    	tmp = 0.0
    	if (Float64((Float64(Float64(2.0 * l_m) / Om_m) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))) <= 0.5)
    		tmp = fma(-0.5, Float64(Float64(l_m / Om_m) * Float64(Float64(l_m * fma(-0.5, cos(Float64(kx * -2.0)), 0.5)) / Om_m)), 1.0);
    	else
    		tmp = sqrt(fma(-0.25, Float64(Om_m / Float64(l_m * sin(ky))), 0.5));
    	end
    	return tmp
    end
    
    l_m = N[Abs[l], $MachinePrecision]
    Om_m = N[Abs[Om], $MachinePrecision]
    code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[Power[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], 0.5], N[(-0.5 * N[(N[(l$95$m / Om$95$m), $MachinePrecision] * N[(N[(l$95$m * N[(-0.5 * N[Cos[N[(kx * -2.0), $MachinePrecision]], $MachinePrecision] + 0.5), $MachinePrecision]), $MachinePrecision] / Om$95$m), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision], N[Sqrt[N[(-0.25 * N[(Om$95$m / N[(l$95$m * N[Sin[ky], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + 0.5), $MachinePrecision]], $MachinePrecision]]
    
    \begin{array}{l}
    l_m = \left|\ell\right|
    \\
    Om_m = \left|Om\right|
    
    \\
    \begin{array}{l}
    \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\
    \;\;\;\;\mathsf{fma}\left(-0.5, \frac{l\_m}{Om\_m} \cdot \frac{l\_m \cdot \mathsf{fma}\left(-0.5, \cos \left(kx \cdot -2\right), 0.5\right)}{Om\_m}, 1\right)\\
    
    \mathbf{else}:\\
    \;\;\;\;\sqrt{\mathsf{fma}\left(-0.25, \frac{Om\_m}{l\_m \cdot \sin ky}, 0.5\right)}\\
    
    
    \end{array}
    \end{array}
    
    Derivation
    1. Split input into 2 regimes
    2. if (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64)))) < 0.5

      1. Initial program 100.0%

        \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
      2. Add Preprocessing
      3. Taylor expanded in ky around 0

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin kx}^{2}}{{Om}^{2}}}}\right)}} \]
      4. Step-by-step derivation
        1. +-commutativeN/A

          \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin kx}^{2}}{{Om}^{2}}}} + 1\right)}} \]
        2. distribute-lft-inN/A

          \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin kx}^{2}}{{Om}^{2}}}} + \frac{1}{2} \cdot 1}} \]
        3. metadata-evalN/A

          \[\leadsto \sqrt{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin kx}^{2}}{{Om}^{2}}}} + \color{blue}{\frac{1}{2}}} \]
        4. accelerator-lowering-fma.f64N/A

          \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin kx}^{2}}{{Om}^{2}}}}, \frac{1}{2}\right)}} \]
      5. Simplified80.7%

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4, \frac{\left(\ell \cdot \ell\right) \cdot {\sin kx}^{2}}{Om \cdot Om}, 1\right)}}, 0.5\right)}} \]
      6. Applied egg-rr80.7%

        \[\leadsto \sqrt{\color{blue}{\frac{0.5}{\sqrt{\mathsf{fma}\left(4, \left(0.5 - 0.5 \cdot \cos \left(kx + kx\right)\right) \cdot \frac{\ell \cdot \ell}{Om \cdot Om}, 1\right)}} + 0.5}} \]
      7. Taylor expanded in l around 0

        \[\leadsto \color{blue}{1 + \frac{-1}{2} \cdot \frac{{\ell}^{2} \cdot \left(\frac{1}{2} - \frac{1}{2} \cdot \cos \left(2 \cdot kx\right)\right)}{{Om}^{2}}} \]
      8. Step-by-step derivation
        1. +-commutativeN/A

          \[\leadsto \color{blue}{\frac{-1}{2} \cdot \frac{{\ell}^{2} \cdot \left(\frac{1}{2} - \frac{1}{2} \cdot \cos \left(2 \cdot kx\right)\right)}{{Om}^{2}} + 1} \]
        2. accelerator-lowering-fma.f64N/A

          \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{-1}{2}, \frac{{\ell}^{2} \cdot \left(\frac{1}{2} - \frac{1}{2} \cdot \cos \left(2 \cdot kx\right)\right)}{{Om}^{2}}, 1\right)} \]
      9. Simplified80.7%

        \[\leadsto \color{blue}{\mathsf{fma}\left(-0.5, \frac{\left(\ell \cdot \ell\right) \cdot \mathsf{fma}\left(-0.5, \cos \left(kx \cdot -2\right), 0.5\right)}{Om \cdot Om}, 1\right)} \]
      10. Step-by-step derivation
        1. associate-*l*N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\color{blue}{\ell \cdot \left(\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)\right)}}{Om \cdot Om}, 1\right) \]
        2. times-fracN/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\frac{\ell}{Om} \cdot \frac{\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)}{Om}}, 1\right) \]
        3. *-lowering-*.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\frac{\ell}{Om} \cdot \frac{\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)}{Om}}, 1\right) \]
        4. /-lowering-/.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\frac{\ell}{Om}} \cdot \frac{\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)}{Om}, 1\right) \]
        5. /-lowering-/.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\ell}{Om} \cdot \color{blue}{\frac{\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)}{Om}}, 1\right) \]
        6. *-lowering-*.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\ell}{Om} \cdot \frac{\color{blue}{\ell \cdot \left(\frac{-1}{2} \cdot \cos \left(kx \cdot -2\right) + \frac{1}{2}\right)}}{Om}, 1\right) \]
        7. accelerator-lowering-fma.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\ell}{Om} \cdot \frac{\ell \cdot \color{blue}{\mathsf{fma}\left(\frac{-1}{2}, \cos \left(kx \cdot -2\right), \frac{1}{2}\right)}}{Om}, 1\right) \]
        8. cos-lowering-cos.f64N/A

          \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\ell}{Om} \cdot \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\cos \left(kx \cdot -2\right)}, \frac{1}{2}\right)}{Om}, 1\right) \]
        9. *-lowering-*.f6498.6

          \[\leadsto \mathsf{fma}\left(-0.5, \frac{\ell}{Om} \cdot \frac{\ell \cdot \mathsf{fma}\left(-0.5, \cos \color{blue}{\left(kx \cdot -2\right)}, 0.5\right)}{Om}, 1\right) \]
      11. Applied egg-rr98.6%

        \[\leadsto \mathsf{fma}\left(-0.5, \color{blue}{\frac{\ell}{Om} \cdot \frac{\ell \cdot \mathsf{fma}\left(-0.5, \cos \left(kx \cdot -2\right), 0.5\right)}{Om}}, 1\right) \]

      if 0.5 < (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))

      1. Initial program 96.6%

        \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
      2. Add Preprocessing
      3. Taylor expanded in kx around 0

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}\right)}} \]
      4. Step-by-step derivation
        1. +-commutativeN/A

          \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + 1\right)}} \]
        2. distribute-lft-inN/A

          \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \frac{1}{2} \cdot 1}} \]
        3. metadata-evalN/A

          \[\leadsto \sqrt{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \color{blue}{\frac{1}{2}}} \]
        4. accelerator-lowering-fma.f64N/A

          \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}, \frac{1}{2}\right)}} \]
      5. Simplified70.1%

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{{\sin ky}^{2}}{Om \cdot Om}, 1\right)}}, 0.5\right)}} \]
      6. Taylor expanded in l around -inf

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} + \frac{-1}{4} \cdot \frac{Om}{\ell \cdot \sin ky}}} \]
      7. Step-by-step derivation
        1. +-commutativeN/A

          \[\leadsto \sqrt{\color{blue}{\frac{-1}{4} \cdot \frac{Om}{\ell \cdot \sin ky} + \frac{1}{2}}} \]
        2. accelerator-lowering-fma.f64N/A

          \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{-1}{4}, \frac{Om}{\ell \cdot \sin ky}, \frac{1}{2}\right)}} \]
        3. /-lowering-/.f64N/A

          \[\leadsto \sqrt{\mathsf{fma}\left(\frac{-1}{4}, \color{blue}{\frac{Om}{\ell \cdot \sin ky}}, \frac{1}{2}\right)} \]
        4. *-lowering-*.f64N/A

          \[\leadsto \sqrt{\mathsf{fma}\left(\frac{-1}{4}, \frac{Om}{\color{blue}{\ell \cdot \sin ky}}, \frac{1}{2}\right)} \]
        5. sin-lowering-sin.f6482.5

          \[\leadsto \sqrt{\mathsf{fma}\left(-0.25, \frac{Om}{\ell \cdot \color{blue}{\sin ky}}, 0.5\right)} \]
      8. Simplified82.5%

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(-0.25, \frac{Om}{\ell \cdot \sin ky}, 0.5\right)}} \]
    3. Recombined 2 regimes into one program.
    4. Add Preprocessing

    Alternative 3: 91.6% accurate, 0.9× speedup?

    \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(-0.25, \frac{Om\_m}{l\_m \cdot \sin ky}, 0.5\right)}\\ \end{array} \end{array} \]
    l_m = (fabs.f64 l)
    Om_m = (fabs.f64 Om)
    (FPCore (l_m Om_m kx ky)
     :precision binary64
     (if (<=
          (*
           (pow (/ (* 2.0 l_m) Om_m) 2.0)
           (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0)))
          0.5)
       1.0
       (sqrt (fma -0.25 (/ Om_m (* l_m (sin ky))) 0.5))))
    l_m = fabs(l);
    Om_m = fabs(Om);
    double code(double l_m, double Om_m, double kx, double ky) {
    	double tmp;
    	if ((pow(((2.0 * l_m) / Om_m), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0))) <= 0.5) {
    		tmp = 1.0;
    	} else {
    		tmp = sqrt(fma(-0.25, (Om_m / (l_m * sin(ky))), 0.5));
    	}
    	return tmp;
    }
    
    l_m = abs(l)
    Om_m = abs(Om)
    function code(l_m, Om_m, kx, ky)
    	tmp = 0.0
    	if (Float64((Float64(Float64(2.0 * l_m) / Om_m) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))) <= 0.5)
    		tmp = 1.0;
    	else
    		tmp = sqrt(fma(-0.25, Float64(Om_m / Float64(l_m * sin(ky))), 0.5));
    	end
    	return tmp
    end
    
    l_m = N[Abs[l], $MachinePrecision]
    Om_m = N[Abs[Om], $MachinePrecision]
    code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[Power[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], 0.5], 1.0, N[Sqrt[N[(-0.25 * N[(Om$95$m / N[(l$95$m * N[Sin[ky], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + 0.5), $MachinePrecision]], $MachinePrecision]]
    
    \begin{array}{l}
    l_m = \left|\ell\right|
    \\
    Om_m = \left|Om\right|
    
    \\
    \begin{array}{l}
    \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\
    \;\;\;\;1\\
    
    \mathbf{else}:\\
    \;\;\;\;\sqrt{\mathsf{fma}\left(-0.25, \frac{Om\_m}{l\_m \cdot \sin ky}, 0.5\right)}\\
    
    
    \end{array}
    \end{array}
    
    Derivation
    1. Split input into 2 regimes
    2. if (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64)))) < 0.5

      1. Initial program 100.0%

        \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
      2. Add Preprocessing
      3. Taylor expanded in l around 0

        \[\leadsto \sqrt{\color{blue}{1}} \]
      4. Step-by-step derivation
        1. Simplified98.2%

          \[\leadsto \sqrt{\color{blue}{1}} \]
        2. Step-by-step derivation
          1. metadata-eval98.2

            \[\leadsto \color{blue}{1} \]
        3. Applied egg-rr98.2%

          \[\leadsto \color{blue}{1} \]

        if 0.5 < (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))

        1. Initial program 96.6%

          \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
        2. Add Preprocessing
        3. Taylor expanded in kx around 0

          \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}\right)}} \]
        4. Step-by-step derivation
          1. +-commutativeN/A

            \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + 1\right)}} \]
          2. distribute-lft-inN/A

            \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \frac{1}{2} \cdot 1}} \]
          3. metadata-evalN/A

            \[\leadsto \sqrt{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \color{blue}{\frac{1}{2}}} \]
          4. accelerator-lowering-fma.f64N/A

            \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}, \frac{1}{2}\right)}} \]
        5. Simplified70.1%

          \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{{\sin ky}^{2}}{Om \cdot Om}, 1\right)}}, 0.5\right)}} \]
        6. Taylor expanded in l around -inf

          \[\leadsto \sqrt{\color{blue}{\frac{1}{2} + \frac{-1}{4} \cdot \frac{Om}{\ell \cdot \sin ky}}} \]
        7. Step-by-step derivation
          1. +-commutativeN/A

            \[\leadsto \sqrt{\color{blue}{\frac{-1}{4} \cdot \frac{Om}{\ell \cdot \sin ky} + \frac{1}{2}}} \]
          2. accelerator-lowering-fma.f64N/A

            \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{-1}{4}, \frac{Om}{\ell \cdot \sin ky}, \frac{1}{2}\right)}} \]
          3. /-lowering-/.f64N/A

            \[\leadsto \sqrt{\mathsf{fma}\left(\frac{-1}{4}, \color{blue}{\frac{Om}{\ell \cdot \sin ky}}, \frac{1}{2}\right)} \]
          4. *-lowering-*.f64N/A

            \[\leadsto \sqrt{\mathsf{fma}\left(\frac{-1}{4}, \frac{Om}{\color{blue}{\ell \cdot \sin ky}}, \frac{1}{2}\right)} \]
          5. sin-lowering-sin.f6482.5

            \[\leadsto \sqrt{\mathsf{fma}\left(-0.25, \frac{Om}{\ell \cdot \color{blue}{\sin ky}}, 0.5\right)} \]
        8. Simplified82.5%

          \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(-0.25, \frac{Om}{\ell \cdot \sin ky}, 0.5\right)}} \]
      5. Recombined 2 regimes into one program.
      6. Add Preprocessing

      Alternative 4: 98.4% accurate, 1.0× speedup?

      \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \end{array} \]
      l_m = (fabs.f64 l)
      Om_m = (fabs.f64 Om)
      (FPCore (l_m Om_m kx ky)
       :precision binary64
       (sqrt
        (*
         (/ 1.0 2.0)
         (+
          1.0
          (/
           1.0
           (sqrt
            (+
             1.0
             (*
              (pow (/ (* 2.0 l_m) Om_m) 2.0)
              (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))
      l_m = fabs(l);
      Om_m = fabs(Om);
      double code(double l_m, double Om_m, double kx, double ky) {
      	return sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + (pow(((2.0 * l_m) / Om_m), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0)))))))));
      }
      
      l_m = abs(l)
      Om_m = abs(om)
      real(8) function code(l_m, om_m, kx, ky)
          real(8), intent (in) :: l_m
          real(8), intent (in) :: om_m
          real(8), intent (in) :: kx
          real(8), intent (in) :: ky
          code = sqrt(((1.0d0 / 2.0d0) * (1.0d0 + (1.0d0 / sqrt((1.0d0 + ((((2.0d0 * l_m) / om_m) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0)))))))))
      end function
      
      l_m = Math.abs(l);
      Om_m = Math.abs(Om);
      public static double code(double l_m, double Om_m, double kx, double ky) {
      	return Math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / Math.sqrt((1.0 + (Math.pow(((2.0 * l_m) / Om_m), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0)))))))));
      }
      
      l_m = math.fabs(l)
      Om_m = math.fabs(Om)
      def code(l_m, Om_m, kx, ky):
      	return math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / math.sqrt((1.0 + (math.pow(((2.0 * l_m) / Om_m), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0)))))))))
      
      l_m = abs(l)
      Om_m = abs(Om)
      function code(l_m, Om_m, kx, ky)
      	return sqrt(Float64(Float64(1.0 / 2.0) * Float64(1.0 + Float64(1.0 / sqrt(Float64(1.0 + Float64((Float64(Float64(2.0 * l_m) / Om_m) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))))
      end
      
      l_m = abs(l);
      Om_m = abs(Om);
      function tmp = code(l_m, Om_m, kx, ky)
      	tmp = sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + ((((2.0 * l_m) / Om_m) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0)))))))));
      end
      
      l_m = N[Abs[l], $MachinePrecision]
      Om_m = N[Abs[Om], $MachinePrecision]
      code[l$95$m_, Om$95$m_, kx_, ky_] := N[Sqrt[N[(N[(1.0 / 2.0), $MachinePrecision] * N[(1.0 + N[(1.0 / N[Sqrt[N[(1.0 + N[(N[Power[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
      
      \begin{array}{l}
      l_m = \left|\ell\right|
      \\
      Om_m = \left|Om\right|
      
      \\
      \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)}
      \end{array}
      
      Derivation
      1. Initial program 98.4%

        \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
      2. Add Preprocessing
      3. Add Preprocessing

      Alternative 5: 91.6% accurate, 1.0× speedup?

      \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{Om\_m}{l\_m \cdot ky}, 0.5\right)}\\ \end{array} \end{array} \]
      l_m = (fabs.f64 l)
      Om_m = (fabs.f64 Om)
      (FPCore (l_m Om_m kx ky)
       :precision binary64
       (if (<=
            (*
             (pow (/ (* 2.0 l_m) Om_m) 2.0)
             (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0)))
            0.5)
         1.0
         (sqrt (fma 0.25 (/ Om_m (* l_m ky)) 0.5))))
      l_m = fabs(l);
      Om_m = fabs(Om);
      double code(double l_m, double Om_m, double kx, double ky) {
      	double tmp;
      	if ((pow(((2.0 * l_m) / Om_m), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0))) <= 0.5) {
      		tmp = 1.0;
      	} else {
      		tmp = sqrt(fma(0.25, (Om_m / (l_m * ky)), 0.5));
      	}
      	return tmp;
      }
      
      l_m = abs(l)
      Om_m = abs(Om)
      function code(l_m, Om_m, kx, ky)
      	tmp = 0.0
      	if (Float64((Float64(Float64(2.0 * l_m) / Om_m) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))) <= 0.5)
      		tmp = 1.0;
      	else
      		tmp = sqrt(fma(0.25, Float64(Om_m / Float64(l_m * ky)), 0.5));
      	end
      	return tmp
      end
      
      l_m = N[Abs[l], $MachinePrecision]
      Om_m = N[Abs[Om], $MachinePrecision]
      code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[Power[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], 0.5], 1.0, N[Sqrt[N[(0.25 * N[(Om$95$m / N[(l$95$m * ky), $MachinePrecision]), $MachinePrecision] + 0.5), $MachinePrecision]], $MachinePrecision]]
      
      \begin{array}{l}
      l_m = \left|\ell\right|
      \\
      Om_m = \left|Om\right|
      
      \\
      \begin{array}{l}
      \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\
      \;\;\;\;1\\
      
      \mathbf{else}:\\
      \;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{Om\_m}{l\_m \cdot ky}, 0.5\right)}\\
      
      
      \end{array}
      \end{array}
      
      Derivation
      1. Split input into 2 regimes
      2. if (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64)))) < 0.5

        1. Initial program 100.0%

          \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
        2. Add Preprocessing
        3. Taylor expanded in l around 0

          \[\leadsto \sqrt{\color{blue}{1}} \]
        4. Step-by-step derivation
          1. Simplified98.2%

            \[\leadsto \sqrt{\color{blue}{1}} \]
          2. Step-by-step derivation
            1. metadata-eval98.2

              \[\leadsto \color{blue}{1} \]
          3. Applied egg-rr98.2%

            \[\leadsto \color{blue}{1} \]

          if 0.5 < (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))

          1. Initial program 96.6%

            \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
          2. Add Preprocessing
          3. Taylor expanded in kx around 0

            \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}\right)}} \]
          4. Step-by-step derivation
            1. +-commutativeN/A

              \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + 1\right)}} \]
            2. distribute-lft-inN/A

              \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \frac{1}{2} \cdot 1}} \]
            3. metadata-evalN/A

              \[\leadsto \sqrt{\frac{1}{2} \cdot \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}} + \color{blue}{\frac{1}{2}}} \]
            4. accelerator-lowering-fma.f64N/A

              \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{1 + 4 \cdot \frac{{\ell}^{2} \cdot {\sin ky}^{2}}{{Om}^{2}}}}, \frac{1}{2}\right)}} \]
          5. Simplified70.1%

            \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{{\sin ky}^{2}}{Om \cdot Om}, 1\right)}}, 0.5\right)}} \]
          6. Taylor expanded in ky around 0

            \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \color{blue}{\frac{{ky}^{2}}{{Om}^{2}}}, 1\right)}}, \frac{1}{2}\right)} \]
          7. Step-by-step derivation
            1. /-lowering-/.f64N/A

              \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \color{blue}{\frac{{ky}^{2}}{{Om}^{2}}}, 1\right)}}, \frac{1}{2}\right)} \]
            2. unpow2N/A

              \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{\color{blue}{ky \cdot ky}}{{Om}^{2}}, 1\right)}}, \frac{1}{2}\right)} \]
            3. *-lowering-*.f64N/A

              \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{\color{blue}{ky \cdot ky}}{{Om}^{2}}, 1\right)}}, \frac{1}{2}\right)} \]
            4. unpow2N/A

              \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{2}, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{ky \cdot ky}{\color{blue}{Om \cdot Om}}, 1\right)}}, \frac{1}{2}\right)} \]
            5. *-lowering-*.f6469.8

              \[\leadsto \sqrt{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \frac{ky \cdot ky}{\color{blue}{Om \cdot Om}}, 1\right)}}, 0.5\right)} \]
          8. Simplified69.8%

            \[\leadsto \sqrt{\mathsf{fma}\left(0.5, \sqrt{\frac{1}{\mathsf{fma}\left(4 \cdot \left(\ell \cdot \ell\right), \color{blue}{\frac{ky \cdot ky}{Om \cdot Om}}, 1\right)}}, 0.5\right)} \]
          9. Taylor expanded in l around inf

            \[\leadsto \sqrt{\color{blue}{\frac{1}{2} + \frac{1}{4} \cdot \frac{Om}{ky \cdot \ell}}} \]
          10. Step-by-step derivation
            1. +-commutativeN/A

              \[\leadsto \sqrt{\color{blue}{\frac{1}{4} \cdot \frac{Om}{ky \cdot \ell} + \frac{1}{2}}} \]
            2. accelerator-lowering-fma.f64N/A

              \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{4}, \frac{Om}{ky \cdot \ell}, \frac{1}{2}\right)}} \]
            3. /-lowering-/.f64N/A

              \[\leadsto \sqrt{\mathsf{fma}\left(\frac{1}{4}, \color{blue}{\frac{Om}{ky \cdot \ell}}, \frac{1}{2}\right)} \]
            4. *-lowering-*.f6483.2

              \[\leadsto \sqrt{\mathsf{fma}\left(0.25, \frac{Om}{\color{blue}{ky \cdot \ell}}, 0.5\right)} \]
          11. Simplified83.2%

            \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.25, \frac{Om}{ky \cdot \ell}, 0.5\right)}} \]
        5. Recombined 2 regimes into one program.
        6. Final simplification91.4%

          \[\leadsto \begin{array}{l} \mathbf{if}\;{\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 0.5:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{Om}{\ell \cdot ky}, 0.5\right)}\\ \end{array} \]
        7. Add Preprocessing

        Alternative 6: 98.1% accurate, 1.1× speedup?

        \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 3.8:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;\sqrt{0.5}\\ \end{array} \end{array} \]
        l_m = (fabs.f64 l)
        Om_m = (fabs.f64 Om)
        (FPCore (l_m Om_m kx ky)
         :precision binary64
         (if (<=
              (*
               (pow (/ (* 2.0 l_m) Om_m) 2.0)
               (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0)))
              3.8)
           1.0
           (sqrt 0.5)))
        l_m = fabs(l);
        Om_m = fabs(Om);
        double code(double l_m, double Om_m, double kx, double ky) {
        	double tmp;
        	if ((pow(((2.0 * l_m) / Om_m), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0))) <= 3.8) {
        		tmp = 1.0;
        	} else {
        		tmp = sqrt(0.5);
        	}
        	return tmp;
        }
        
        l_m = abs(l)
        Om_m = abs(om)
        real(8) function code(l_m, om_m, kx, ky)
            real(8), intent (in) :: l_m
            real(8), intent (in) :: om_m
            real(8), intent (in) :: kx
            real(8), intent (in) :: ky
            real(8) :: tmp
            if (((((2.0d0 * l_m) / om_m) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0))) <= 3.8d0) then
                tmp = 1.0d0
            else
                tmp = sqrt(0.5d0)
            end if
            code = tmp
        end function
        
        l_m = Math.abs(l);
        Om_m = Math.abs(Om);
        public static double code(double l_m, double Om_m, double kx, double ky) {
        	double tmp;
        	if ((Math.pow(((2.0 * l_m) / Om_m), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0))) <= 3.8) {
        		tmp = 1.0;
        	} else {
        		tmp = Math.sqrt(0.5);
        	}
        	return tmp;
        }
        
        l_m = math.fabs(l)
        Om_m = math.fabs(Om)
        def code(l_m, Om_m, kx, ky):
        	tmp = 0
        	if (math.pow(((2.0 * l_m) / Om_m), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0))) <= 3.8:
        		tmp = 1.0
        	else:
        		tmp = math.sqrt(0.5)
        	return tmp
        
        l_m = abs(l)
        Om_m = abs(Om)
        function code(l_m, Om_m, kx, ky)
        	tmp = 0.0
        	if (Float64((Float64(Float64(2.0 * l_m) / Om_m) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))) <= 3.8)
        		tmp = 1.0;
        	else
        		tmp = sqrt(0.5);
        	end
        	return tmp
        end
        
        l_m = abs(l);
        Om_m = abs(Om);
        function tmp_2 = code(l_m, Om_m, kx, ky)
        	tmp = 0.0;
        	if (((((2.0 * l_m) / Om_m) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))) <= 3.8)
        		tmp = 1.0;
        	else
        		tmp = sqrt(0.5);
        	end
        	tmp_2 = tmp;
        end
        
        l_m = N[Abs[l], $MachinePrecision]
        Om_m = N[Abs[Om], $MachinePrecision]
        code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[Power[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision], 3.8], 1.0, N[Sqrt[0.5], $MachinePrecision]]
        
        \begin{array}{l}
        l_m = \left|\ell\right|
        \\
        Om_m = \left|Om\right|
        
        \\
        \begin{array}{l}
        \mathbf{if}\;{\left(\frac{2 \cdot l\_m}{Om\_m}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right) \leq 3.8:\\
        \;\;\;\;1\\
        
        \mathbf{else}:\\
        \;\;\;\;\sqrt{0.5}\\
        
        
        \end{array}
        \end{array}
        
        Derivation
        1. Split input into 2 regimes
        2. if (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64)))) < 3.7999999999999998

          1. Initial program 100.0%

            \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
          2. Add Preprocessing
          3. Taylor expanded in l around 0

            \[\leadsto \sqrt{\color{blue}{1}} \]
          4. Step-by-step derivation
            1. Simplified98.2%

              \[\leadsto \sqrt{\color{blue}{1}} \]
            2. Step-by-step derivation
              1. metadata-eval98.2

                \[\leadsto \color{blue}{1} \]
            3. Applied egg-rr98.2%

              \[\leadsto \color{blue}{1} \]

            if 3.7999999999999998 < (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))

            1. Initial program 96.6%

              \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
            2. Add Preprocessing
            3. Taylor expanded in l around inf

              \[\leadsto \sqrt{\color{blue}{\frac{1}{2}}} \]
            4. Step-by-step derivation
              1. Simplified97.0%

                \[\leadsto \sqrt{\color{blue}{0.5}} \]
            5. Recombined 2 regimes into one program.
            6. Add Preprocessing

            Alternative 7: 98.3% accurate, 1.8× speedup?

            \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\ \;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{\mathsf{fma}\left(l\_m, -0.5 \cdot \left(\cos \left(kx \cdot -2\right) + \cos \left(ky \cdot -2\right)\right), l\_m\right)}{Om\_m}, 1\right)}}\right)}\\ \mathbf{else}:\\ \;\;\;\;\sqrt{0.5}\\ \end{array} \end{array} \]
            l_m = (fabs.f64 l)
            Om_m = (fabs.f64 Om)
            (FPCore (l_m Om_m kx ky)
             :precision binary64
             (if (<= (/ (* 2.0 l_m) Om_m) 2.5e+96)
               (sqrt
                (*
                 0.5
                 (+
                  1.0
                  (/
                   1.0
                   (sqrt
                    (fma
                     (* (/ l_m Om_m) 4.0)
                     (/
                      (fma l_m (* -0.5 (+ (cos (* kx -2.0)) (cos (* ky -2.0)))) l_m)
                      Om_m)
                     1.0))))))
               (sqrt 0.5)))
            l_m = fabs(l);
            Om_m = fabs(Om);
            double code(double l_m, double Om_m, double kx, double ky) {
            	double tmp;
            	if (((2.0 * l_m) / Om_m) <= 2.5e+96) {
            		tmp = sqrt((0.5 * (1.0 + (1.0 / sqrt(fma(((l_m / Om_m) * 4.0), (fma(l_m, (-0.5 * (cos((kx * -2.0)) + cos((ky * -2.0)))), l_m) / Om_m), 1.0))))));
            	} else {
            		tmp = sqrt(0.5);
            	}
            	return tmp;
            }
            
            l_m = abs(l)
            Om_m = abs(Om)
            function code(l_m, Om_m, kx, ky)
            	tmp = 0.0
            	if (Float64(Float64(2.0 * l_m) / Om_m) <= 2.5e+96)
            		tmp = sqrt(Float64(0.5 * Float64(1.0 + Float64(1.0 / sqrt(fma(Float64(Float64(l_m / Om_m) * 4.0), Float64(fma(l_m, Float64(-0.5 * Float64(cos(Float64(kx * -2.0)) + cos(Float64(ky * -2.0)))), l_m) / Om_m), 1.0))))));
            	else
            		tmp = sqrt(0.5);
            	end
            	return tmp
            end
            
            l_m = N[Abs[l], $MachinePrecision]
            Om_m = N[Abs[Om], $MachinePrecision]
            code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.5e+96], N[Sqrt[N[(0.5 * N[(1.0 + N[(1.0 / N[Sqrt[N[(N[(N[(l$95$m / Om$95$m), $MachinePrecision] * 4.0), $MachinePrecision] * N[(N[(l$95$m * N[(-0.5 * N[(N[Cos[N[(kx * -2.0), $MachinePrecision]], $MachinePrecision] + N[Cos[N[(ky * -2.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], N[Sqrt[0.5], $MachinePrecision]]
            
            \begin{array}{l}
            l_m = \left|\ell\right|
            \\
            Om_m = \left|Om\right|
            
            \\
            \begin{array}{l}
            \mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\
            \;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{\mathsf{fma}\left(l\_m, -0.5 \cdot \left(\cos \left(kx \cdot -2\right) + \cos \left(ky \cdot -2\right)\right), l\_m\right)}{Om\_m}, 1\right)}}\right)}\\
            
            \mathbf{else}:\\
            \;\;\;\;\sqrt{0.5}\\
            
            
            \end{array}
            \end{array}
            
            Derivation
            1. Split input into 2 regimes
            2. if (/.f64 (*.f64 #s(literal 2 binary64) l) Om) < 2.5000000000000002e96

              1. Initial program 100.0%

                \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
              2. Add Preprocessing
              3. Applied egg-rr96.4%

                \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\color{blue}{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}}\right)} \]
              4. Step-by-step derivation
                1. metadata-eval96.4

                  \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]
              5. Applied egg-rr96.4%

                \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]
              6. Taylor expanded in l around 0

                \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\ell \cdot \left(1 + \left(\frac{-1}{2} \cdot \cos \left(2 \cdot kx\right) + \frac{-1}{2} \cdot \cos \left(2 \cdot ky\right)\right)\right)}{Om}}, 1\right)}}\right)} \]
              7. Step-by-step derivation
                1. /-lowering-/.f64N/A

                  \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\ell \cdot \left(1 + \left(\frac{-1}{2} \cdot \cos \left(2 \cdot kx\right) + \frac{-1}{2} \cdot \cos \left(2 \cdot ky\right)\right)\right)}{Om}}, 1\right)}}\right)} \]
              8. Simplified96.3%

                \[\leadsto \sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\mathsf{fma}\left(\ell, -0.5 \cdot \left(\cos \left(kx \cdot -2\right) + \cos \left(ky \cdot -2\right)\right), \ell\right)}{Om}}, 1\right)}}\right)} \]

              if 2.5000000000000002e96 < (/.f64 (*.f64 #s(literal 2 binary64) l) Om)

              1. Initial program 91.8%

                \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
              2. Add Preprocessing
              3. Taylor expanded in l around inf

                \[\leadsto \sqrt{\color{blue}{\frac{1}{2}}} \]
              4. Step-by-step derivation
                1. Simplified98.4%

                  \[\leadsto \sqrt{\color{blue}{0.5}} \]
              5. Recombined 2 regimes into one program.
              6. Add Preprocessing

              Alternative 8: 94.9% accurate, 2.8× speedup?

              \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ \begin{array}{l} \mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\ \;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{l\_m \cdot \mathsf{fma}\left(-0.5, \cos \left(ky \cdot -2\right), 0.5\right)}{Om\_m}, 1\right)}}\right)}\\ \mathbf{else}:\\ \;\;\;\;\sqrt{0.5}\\ \end{array} \end{array} \]
              l_m = (fabs.f64 l)
              Om_m = (fabs.f64 Om)
              (FPCore (l_m Om_m kx ky)
               :precision binary64
               (if (<= (/ (* 2.0 l_m) Om_m) 2.5e+96)
                 (sqrt
                  (*
                   0.5
                   (+
                    1.0
                    (/
                     1.0
                     (sqrt
                      (fma
                       (* (/ l_m Om_m) 4.0)
                       (/ (* l_m (fma -0.5 (cos (* ky -2.0)) 0.5)) Om_m)
                       1.0))))))
                 (sqrt 0.5)))
              l_m = fabs(l);
              Om_m = fabs(Om);
              double code(double l_m, double Om_m, double kx, double ky) {
              	double tmp;
              	if (((2.0 * l_m) / Om_m) <= 2.5e+96) {
              		tmp = sqrt((0.5 * (1.0 + (1.0 / sqrt(fma(((l_m / Om_m) * 4.0), ((l_m * fma(-0.5, cos((ky * -2.0)), 0.5)) / Om_m), 1.0))))));
              	} else {
              		tmp = sqrt(0.5);
              	}
              	return tmp;
              }
              
              l_m = abs(l)
              Om_m = abs(Om)
              function code(l_m, Om_m, kx, ky)
              	tmp = 0.0
              	if (Float64(Float64(2.0 * l_m) / Om_m) <= 2.5e+96)
              		tmp = sqrt(Float64(0.5 * Float64(1.0 + Float64(1.0 / sqrt(fma(Float64(Float64(l_m / Om_m) * 4.0), Float64(Float64(l_m * fma(-0.5, cos(Float64(ky * -2.0)), 0.5)) / Om_m), 1.0))))));
              	else
              		tmp = sqrt(0.5);
              	end
              	return tmp
              end
              
              l_m = N[Abs[l], $MachinePrecision]
              Om_m = N[Abs[Om], $MachinePrecision]
              code[l$95$m_, Om$95$m_, kx_, ky_] := If[LessEqual[N[(N[(2.0 * l$95$m), $MachinePrecision] / Om$95$m), $MachinePrecision], 2.5e+96], N[Sqrt[N[(0.5 * N[(1.0 + N[(1.0 / N[Sqrt[N[(N[(N[(l$95$m / Om$95$m), $MachinePrecision] * 4.0), $MachinePrecision] * N[(N[(l$95$m * N[(-0.5 * N[Cos[N[(ky * -2.0), $MachinePrecision]], $MachinePrecision] + 0.5), $MachinePrecision]), $MachinePrecision] / Om$95$m), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], N[Sqrt[0.5], $MachinePrecision]]
              
              \begin{array}{l}
              l_m = \left|\ell\right|
              \\
              Om_m = \left|Om\right|
              
              \\
              \begin{array}{l}
              \mathbf{if}\;\frac{2 \cdot l\_m}{Om\_m} \leq 2.5 \cdot 10^{+96}:\\
              \;\;\;\;\sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{l\_m}{Om\_m} \cdot 4, \frac{l\_m \cdot \mathsf{fma}\left(-0.5, \cos \left(ky \cdot -2\right), 0.5\right)}{Om\_m}, 1\right)}}\right)}\\
              
              \mathbf{else}:\\
              \;\;\;\;\sqrt{0.5}\\
              
              
              \end{array}
              \end{array}
              
              Derivation
              1. Split input into 2 regimes
              2. if (/.f64 (*.f64 #s(literal 2 binary64) l) Om) < 2.5000000000000002e96

                1. Initial program 100.0%

                  \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
                2. Add Preprocessing
                3. Applied egg-rr96.4%

                  \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\color{blue}{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}}\right)} \]
                4. Step-by-step derivation
                  1. metadata-eval96.4

                    \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]
                5. Applied egg-rr96.4%

                  \[\leadsto \sqrt{\color{blue}{0.5} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell}{Om} \cdot \left(\left(0.5 + -0.5 \cdot \cos \left(kx + kx\right)\right) + \left(0.5 + -0.5 \cdot \cos \left(ky + ky\right)\right)\right), 1\right)}}\right)} \]
                6. Taylor expanded in kx around 0

                  \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\ell \cdot \left(\frac{1}{2} + \frac{-1}{2} \cdot \cos \left(2 \cdot ky\right)\right)}{Om}}, 1\right)}}\right)} \]
                7. Step-by-step derivation
                  1. /-lowering-/.f64N/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\ell \cdot \left(\frac{1}{2} + \frac{-1}{2} \cdot \cos \left(2 \cdot ky\right)\right)}{Om}}, 1\right)}}\right)} \]
                  2. *-lowering-*.f64N/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\color{blue}{\ell \cdot \left(\frac{1}{2} + \frac{-1}{2} \cdot \cos \left(2 \cdot ky\right)\right)}}{Om}, 1\right)}}\right)} \]
                  3. +-commutativeN/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \color{blue}{\left(\frac{-1}{2} \cdot \cos \left(2 \cdot ky\right) + \frac{1}{2}\right)}}{Om}, 1\right)}}\right)} \]
                  4. accelerator-lowering-fma.f64N/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \color{blue}{\mathsf{fma}\left(\frac{-1}{2}, \cos \left(2 \cdot ky\right), \frac{1}{2}\right)}}{Om}, 1\right)}}\right)} \]
                  5. metadata-evalN/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \cos \left(\color{blue}{\left(\mathsf{neg}\left(-2\right)\right)} \cdot ky\right), \frac{1}{2}\right)}{Om}, 1\right)}}\right)} \]
                  6. distribute-lft-neg-inN/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \cos \color{blue}{\left(\mathsf{neg}\left(-2 \cdot ky\right)\right)}, \frac{1}{2}\right)}{Om}, 1\right)}}\right)} \]
                  7. cos-negN/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\cos \left(-2 \cdot ky\right)}, \frac{1}{2}\right)}{Om}, 1\right)}}\right)} \]
                  8. cos-lowering-cos.f64N/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\cos \left(-2 \cdot ky\right)}, \frac{1}{2}\right)}{Om}, 1\right)}}\right)} \]
                  9. *-commutativeN/A

                    \[\leadsto \sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(\frac{-1}{2}, \cos \color{blue}{\left(ky \cdot -2\right)}, \frac{1}{2}\right)}{Om}, 1\right)}}\right)} \]
                  10. *-lowering-*.f6488.1

                    \[\leadsto \sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \frac{\ell \cdot \mathsf{fma}\left(-0.5, \cos \color{blue}{\left(ky \cdot -2\right)}, 0.5\right)}{Om}, 1\right)}}\right)} \]
                8. Simplified88.1%

                  \[\leadsto \sqrt{0.5 \cdot \left(1 + \frac{1}{\sqrt{\mathsf{fma}\left(\frac{\ell}{Om} \cdot 4, \color{blue}{\frac{\ell \cdot \mathsf{fma}\left(-0.5, \cos \left(ky \cdot -2\right), 0.5\right)}{Om}}, 1\right)}}\right)} \]

                if 2.5000000000000002e96 < (/.f64 (*.f64 #s(literal 2 binary64) l) Om)

                1. Initial program 91.8%

                  \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
                2. Add Preprocessing
                3. Taylor expanded in l around inf

                  \[\leadsto \sqrt{\color{blue}{\frac{1}{2}}} \]
                4. Step-by-step derivation
                  1. Simplified98.4%

                    \[\leadsto \sqrt{\color{blue}{0.5}} \]
                5. Recombined 2 regimes into one program.
                6. Add Preprocessing

                Alternative 9: 62.5% accurate, 581.0× speedup?

                \[\begin{array}{l} l_m = \left|\ell\right| \\ Om_m = \left|Om\right| \\ 1 \end{array} \]
                l_m = (fabs.f64 l)
                Om_m = (fabs.f64 Om)
                (FPCore (l_m Om_m kx ky) :precision binary64 1.0)
                l_m = fabs(l);
                Om_m = fabs(Om);
                double code(double l_m, double Om_m, double kx, double ky) {
                	return 1.0;
                }
                
                l_m = abs(l)
                Om_m = abs(om)
                real(8) function code(l_m, om_m, kx, ky)
                    real(8), intent (in) :: l_m
                    real(8), intent (in) :: om_m
                    real(8), intent (in) :: kx
                    real(8), intent (in) :: ky
                    code = 1.0d0
                end function
                
                l_m = Math.abs(l);
                Om_m = Math.abs(Om);
                public static double code(double l_m, double Om_m, double kx, double ky) {
                	return 1.0;
                }
                
                l_m = math.fabs(l)
                Om_m = math.fabs(Om)
                def code(l_m, Om_m, kx, ky):
                	return 1.0
                
                l_m = abs(l)
                Om_m = abs(Om)
                function code(l_m, Om_m, kx, ky)
                	return 1.0
                end
                
                l_m = abs(l);
                Om_m = abs(Om);
                function tmp = code(l_m, Om_m, kx, ky)
                	tmp = 1.0;
                end
                
                l_m = N[Abs[l], $MachinePrecision]
                Om_m = N[Abs[Om], $MachinePrecision]
                code[l$95$m_, Om$95$m_, kx_, ky_] := 1.0
                
                \begin{array}{l}
                l_m = \left|\ell\right|
                \\
                Om_m = \left|Om\right|
                
                \\
                1
                \end{array}
                
                Derivation
                1. Initial program 98.4%

                  \[\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)} \]
                2. Add Preprocessing
                3. Taylor expanded in l around 0

                  \[\leadsto \sqrt{\color{blue}{1}} \]
                4. Step-by-step derivation
                  1. Simplified63.1%

                    \[\leadsto \sqrt{\color{blue}{1}} \]
                  2. Step-by-step derivation
                    1. metadata-eval63.1

                      \[\leadsto \color{blue}{1} \]
                  3. Applied egg-rr63.1%

                    \[\leadsto \color{blue}{1} \]
                  4. Add Preprocessing

                  Reproduce

                  ?
                  herbie shell --seed 2024199 
                  (FPCore (l Om kx ky)
                    :name "Toniolo and Linder, Equation (3a)"
                    :precision binary64
                    (sqrt (* (/ 1.0 2.0) (+ 1.0 (/ 1.0 (sqrt (+ 1.0 (* (pow (/ (* 2.0 l) Om) 2.0) (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))