Bouland and Aaronson, Equation (26)

Percentage Accurate: 99.9% → 99.9%
Time: 11.2s
Alternatives: 8
Speedup: 3.3×

Specification

?
\[\begin{array}{l} \\ \left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \end{array} \]
(FPCore (a b)
 :precision binary64
 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (* b b))) 1.0))
double code(double a, double b) {
	return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0;
}
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (b * b))) - 1.0d0
end function
public static double code(double a, double b) {
	return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0;
}
def code(a, b):
	return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0
function code(a, b)
	return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(b * b))) - 1.0)
end
function tmp = code(a, b)
	tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (b * b))) - 1.0;
end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}

\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. The horizontal axis shows the value of an input variable; the variable is chosen in the title. The vertical axis is accuracy; higher is better. Red represents the original program, while blue represents Herbie's suggestion. These can be toggled with the buttons below the plot. The line is an average, while the dots represent individual samples.

Accuracy vs Speed?

Herbie found 8 alternatives:

Alternative | Accuracy | Speedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternative. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative. The line shows the best available speed-accuracy tradeoffs.

Initial Program: 99.9% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \end{array} \]
(FPCore (a b)
 :precision binary64
 (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (* b b))) 1.0))
double code(double a, double b) {
	return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0;
}
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (b * b))) - 1.0d0
end function
public static double code(double a, double b) {
	return (Math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0;
}
def code(a, b):
	return (math.pow(((a * a) + (b * b)), 2.0) + (4.0 * (b * b))) - 1.0
function code(a, b)
	return Float64(Float64((Float64(Float64(a * a) + Float64(b * b)) ^ 2.0) + Float64(4.0 * Float64(b * b))) - 1.0)
end
function tmp = code(a, b)
	tmp = ((((a * a) + (b * b)) ^ 2.0) + (4.0 * (b * b))) - 1.0;
end
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}

\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1
\end{array}

Alternative 1: 99.9% accurate, 3.3× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \mathsf{fma}\left(a, a, b \cdot b\right)\\ \mathsf{fma}\left(t\_0, t\_0, \mathsf{fma}\left(b, b \cdot 4, -1\right)\right) \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (let* ((t_0 (fma a a (* b b)))) (fma t_0 t_0 (fma b (* b 4.0) -1.0))))
double code(double a, double b) {
	double t_0 = fma(a, a, (b * b));
	return fma(t_0, t_0, fma(b, (b * 4.0), -1.0));
}
function code(a, b)
	t_0 = fma(a, a, Float64(b * b))
	return fma(t_0, t_0, fma(b, Float64(b * 4.0), -1.0))
end
code[a_, b_] := Block[{t$95$0 = N[(a * a + N[(b * b), $MachinePrecision]), $MachinePrecision]}, N[(t$95$0 * t$95$0 + N[(b * N[(b * 4.0), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \mathsf{fma}\left(a, a, b \cdot b\right)\\
\mathsf{fma}\left(t\_0, t\_0, \mathsf{fma}\left(b, b \cdot 4, -1\right)\right)
\end{array}
\end{array}
Derivation
  1. Initial program 99.9%

    \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
  2. Add Preprocessing
  3. Step-by-step derivation
    1. associate--l+N/A

      \[\leadsto \color{blue}{{\left(a \cdot a + b \cdot b\right)}^{2} + \left(4 \cdot \left(b \cdot b\right) - 1\right)} \]
    2. unpow2N/A

      \[\leadsto \color{blue}{\left(a \cdot a + b \cdot b\right) \cdot \left(a \cdot a + b \cdot b\right)} + \left(4 \cdot \left(b \cdot b\right) - 1\right) \]
    3. accelerator-lowering-fma.f64N/A

      \[\leadsto \color{blue}{\mathsf{fma}\left(a \cdot a + b \cdot b, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right)} \]
    4. accelerator-lowering-fma.f64N/A

      \[\leadsto \mathsf{fma}\left(\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
    5. *-lowering-*.f64N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
    6. accelerator-lowering-fma.f64N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, 4 \cdot \left(b \cdot b\right) - 1\right) \]
    7. *-lowering-*.f64N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), 4 \cdot \left(b \cdot b\right) - 1\right) \]
    8. sub-negN/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{4 \cdot \left(b \cdot b\right) + \left(\mathsf{neg}\left(1\right)\right)}\right) \]
    9. associate-*r*N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\left(4 \cdot b\right) \cdot b} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
    10. *-commutativeN/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{b \cdot \left(4 \cdot b\right)} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
    11. accelerator-lowering-fma.f64N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(b, 4 \cdot b, \mathsf{neg}\left(1\right)\right)}\right) \]
    12. *-commutativeN/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
    13. *-lowering-*.f64N/A

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
    14. metadata-eval 99.9

      \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, \color{blue}{-1}\right)\right) \]
  4. Applied egg-rr 99.9%

    \[\leadsto \color{blue}{\mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, -1\right)\right)} \]
  5. Add Preprocessing

Alternative 2: 98.3% accurate, 3.3× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;b \cdot b \leq 5 \cdot 10^{-10}:\\ \;\;\;\;\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, \mathsf{fma}\left(2, a \cdot a, 4\right)\right), -1\right)\\ \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (if (<= (* b b) 5e-10)
   (fma a (* a (* a a)) -1.0)
   (fma (* b b) (fma b b (fma 2.0 (* a a) 4.0)) -1.0)))
double code(double a, double b) {
	double tmp;
	if ((b * b) <= 5e-10) {
		tmp = fma(a, (a * (a * a)), -1.0);
	} else {
		tmp = fma((b * b), fma(b, b, fma(2.0, (a * a), 4.0)), -1.0);
	}
	return tmp;
}
function code(a, b)
	tmp = 0.0
	if (Float64(b * b) <= 5e-10)
		tmp = fma(a, Float64(a * Float64(a * a)), -1.0);
	else
		tmp = fma(Float64(b * b), fma(b, b, fma(2.0, Float64(a * a), 4.0)), -1.0);
	end
	return tmp
end
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 5e-10], N[(a * N[(a * N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(N[(b * b), $MachinePrecision] * N[(b * b + N[(2.0 * N[(a * a), $MachinePrecision] + 4.0), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 5 \cdot 10^{-10}:\\
\;\;\;\;\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)\\

\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, \mathsf{fma}\left(2, a \cdot a, 4\right)\right), -1\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (*.f64 b b) < 5.00000000000000031e-10

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in b around 0

      \[\leadsto \color{blue}{{a}^{4} - 1} \]
    4. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{{a}^{4} + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. metadata-evalN/A

        \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} + \left(\mathsf{neg}\left(1\right)\right) \]
      3. pow-sqrN/A

        \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} + \left(\mathsf{neg}\left(1\right)\right) \]
      4. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} + \left(\mathsf{neg}\left(1\right)\right) \]
      5. associate-*l*N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot {a}^{2}, \mathsf{neg}\left(1\right)\right)} \]
      7. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(a, \color{blue}{a \cdot {a}^{2}}, \mathsf{neg}\left(1\right)\right) \]
      8. unpow2N/A

        \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
      9. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
      10. metadata-eval 99.8

        \[\leadsto \mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), \color{blue}{-1}\right) \]
    5. Simplified 99.8%

      \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)} \]

    if 5.00000000000000031e-10 < (*.f64 b b)

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in a around 0

      \[\leadsto \color{blue}{\left(2 \cdot \left({a}^{2} \cdot {b}^{2}\right) + \left(4 \cdot {b}^{2} + {b}^{4}\right)\right) - 1} \]
    4. Step-by-step derivation
      1. associate-+r-N/A

        \[\leadsto \color{blue}{2 \cdot \left({a}^{2} \cdot {b}^{2}\right) + \left(\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1\right)} \]
      2. associate--l+N/A

        \[\leadsto 2 \cdot \left({a}^{2} \cdot {b}^{2}\right) + \color{blue}{\left(4 \cdot {b}^{2} + \left({b}^{4} - 1\right)\right)} \]
      3. associate-+r+N/A

        \[\leadsto \color{blue}{\left(2 \cdot \left({a}^{2} \cdot {b}^{2}\right) + 4 \cdot {b}^{2}\right) + \left({b}^{4} - 1\right)} \]
      4. associate-*r*N/A

        \[\leadsto \left(\color{blue}{\left(2 \cdot {a}^{2}\right) \cdot {b}^{2}} + 4 \cdot {b}^{2}\right) + \left({b}^{4} - 1\right) \]
      5. distribute-rgt-inN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot \left(2 \cdot {a}^{2} + 4\right)} + \left({b}^{4} - 1\right) \]
      6. +-commutativeN/A

        \[\leadsto {b}^{2} \cdot \color{blue}{\left(4 + 2 \cdot {a}^{2}\right)} + \left({b}^{4} - 1\right) \]
      7. sub-negN/A

        \[\leadsto {b}^{2} \cdot \left(4 + 2 \cdot {a}^{2}\right) + \color{blue}{\left({b}^{4} + \left(\mathsf{neg}\left(1\right)\right)\right)} \]
      8. associate-+l+N/A

        \[\leadsto \color{blue}{\left({b}^{2} \cdot \left(4 + 2 \cdot {a}^{2}\right) + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      9. metadata-evalN/A

        \[\leadsto \left({b}^{2} \cdot \left(4 + 2 \cdot {a}^{2}\right) + {b}^{\color{blue}{\left(2 \cdot 2\right)}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      10. pow-sqrN/A

        \[\leadsto \left({b}^{2} \cdot \left(4 + 2 \cdot {a}^{2}\right) + \color{blue}{{b}^{2} \cdot {b}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      11. distribute-lft-inN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot \left(\left(4 + 2 \cdot {a}^{2}\right) + {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      12. associate-+r+N/A

        \[\leadsto {b}^{2} \cdot \color{blue}{\left(4 + \left(2 \cdot {a}^{2} + {b}^{2}\right)\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      13. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left({b}^{2}, 4 + \left(2 \cdot {a}^{2} + {b}^{2}\right), \mathsf{neg}\left(1\right)\right)} \]
    5. Simplified 98.5%

      \[\leadsto \color{blue}{\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, \mathsf{fma}\left(2, a \cdot a, 4\right)\right), -1\right)} \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 3: 94.4% accurate, 4.5× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;a \cdot a \leq 12000000000000:\\ \;\;\;\;\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)\\ \mathbf{else}:\\ \;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\ \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (if (<= (* a a) 12000000000000.0)
   (fma (* b b) (fma b b 4.0) -1.0)
   (* a (* a (* a a)))))
double code(double a, double b) {
	double tmp;
	if ((a * a) <= 12000000000000.0) {
		tmp = fma((b * b), fma(b, b, 4.0), -1.0);
	} else {
		tmp = a * (a * (a * a));
	}
	return tmp;
}
function code(a, b)
	tmp = 0.0
	if (Float64(a * a) <= 12000000000000.0)
		tmp = fma(Float64(b * b), fma(b, b, 4.0), -1.0);
	else
		tmp = Float64(a * Float64(a * Float64(a * a)));
	end
	return tmp
end
code[a_, b_] := If[LessEqual[N[(a * a), $MachinePrecision], 12000000000000.0], N[(N[(b * b), $MachinePrecision] * N[(b * b + 4.0), $MachinePrecision] + -1.0), $MachinePrecision], N[(a * N[(a * N[(a * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;a \cdot a \leq 12000000000000:\\
\;\;\;\;\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)\\

\mathbf{else}:\\
\;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (*.f64 a a) < 1.2e13

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. associate--l+N/A

        \[\leadsto \color{blue}{{\left(a \cdot a + b \cdot b\right)}^{2} + \left(4 \cdot \left(b \cdot b\right) - 1\right)} \]
      2. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a + b \cdot b\right) \cdot \left(a \cdot a + b \cdot b\right)} + \left(4 \cdot \left(b \cdot b\right) - 1\right) \]
      3. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(a \cdot a + b \cdot b, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right)} \]
      4. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      5. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      7. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), 4 \cdot \left(b \cdot b\right) - 1\right) \]
      8. sub-negN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{4 \cdot \left(b \cdot b\right) + \left(\mathsf{neg}\left(1\right)\right)}\right) \]
      9. associate-*r*N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\left(4 \cdot b\right) \cdot b} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      10. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{b \cdot \left(4 \cdot b\right)} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      11. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(b, 4 \cdot b, \mathsf{neg}\left(1\right)\right)}\right) \]
      12. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      13. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      14. metadata-eval 99.9

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, \color{blue}{-1}\right)\right) \]
    4. Applied egg-rr 99.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, -1\right)\right)} \]
    5. Taylor expanded in a around 0

      \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1} \]
    6. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. metadata-evalN/A

        \[\leadsto \left(4 \cdot {b}^{2} + {b}^{\color{blue}{\left(2 \cdot 2\right)}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      3. pow-sqrN/A

        \[\leadsto \left(4 \cdot {b}^{2} + \color{blue}{{b}^{2} \cdot {b}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      4. distribute-rgt-inN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot \left(4 + {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      5. metadata-evalN/A

        \[\leadsto {b}^{2} \cdot \left(4 + {b}^{2}\right) + \color{blue}{-1} \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left({b}^{2}, 4 + {b}^{2}, -1\right)} \]
      7. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      8. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      9. +-commutativeN/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{{b}^{2} + 4}, -1\right) \]
      10. unpow2N/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{b \cdot b} + 4, -1\right) \]
      11. accelerator-lowering-fma.f64 100.0

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{\mathsf{fma}\left(b, b, 4\right)}, -1\right) \]
    7. Simplified 100.0%

      \[\leadsto \color{blue}{\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)} \]

    if 1.2e13 < (*.f64 a a)

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in a around inf

      \[\leadsto \color{blue}{{a}^{4}} \]
    4. Step-by-step derivation
      1. metadata-evalN/A

        \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} \]
      2. pow-sqrN/A

        \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} \]
      3. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} \]
      4. associate-*l*N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
      5. *-lowering-*.f64N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
      6. *-lowering-*.f64N/A

        \[\leadsto a \cdot \color{blue}{\left(a \cdot {a}^{2}\right)} \]
      7. unpow2N/A

        \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
      8. *-lowering-*.f64 94.3

        \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
    5. Simplified 94.3%

      \[\leadsto \color{blue}{a \cdot \left(a \cdot \left(a \cdot a\right)\right)} \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 4: 94.4% accurate, 4.5× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;a \cdot a \leq 12000000000000:\\ \;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), -1\right)\\ \mathbf{else}:\\ \;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\ \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (if (<= (* a a) 12000000000000.0)
   (fma b (* b (fma b b 4.0)) -1.0)
   (* a (* a (* a a)))))
double code(double a, double b) {
	double tmp;
	if ((a * a) <= 12000000000000.0) {
		tmp = fma(b, (b * fma(b, b, 4.0)), -1.0);
	} else {
		tmp = a * (a * (a * a));
	}
	return tmp;
}
function code(a, b)
	tmp = 0.0
	if (Float64(a * a) <= 12000000000000.0)
		tmp = fma(b, Float64(b * fma(b, b, 4.0)), -1.0);
	else
		tmp = Float64(a * Float64(a * Float64(a * a)));
	end
	return tmp
end
code[a_, b_] := If[LessEqual[N[(a * a), $MachinePrecision], 12000000000000.0], N[(b * N[(b * N[(b * b + 4.0), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(a * N[(a * N[(a * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;a \cdot a \leq 12000000000000:\\
\;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), -1\right)\\

\mathbf{else}:\\
\;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (*.f64 a a) < 1.2e13

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in a around 0

      \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1} \]
    4. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. *-commutativeN/A

        \[\leadsto \left(\color{blue}{{b}^{2} \cdot 4} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      3. unpow2N/A

        \[\leadsto \left(\color{blue}{\left(b \cdot b\right)} \cdot 4 + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      4. associate-*l*N/A

        \[\leadsto \left(\color{blue}{b \cdot \left(b \cdot 4\right)} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      5. metadata-evalN/A

        \[\leadsto \left(b \cdot \left(b \cdot 4\right) + {b}^{\color{blue}{\left(2 \cdot 2\right)}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      6. pow-sqrN/A

        \[\leadsto \left(b \cdot \left(b \cdot 4\right) + \color{blue}{{b}^{2} \cdot {b}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      7. unpow2N/A

        \[\leadsto \left(b \cdot \left(b \cdot 4\right) + \color{blue}{\left(b \cdot b\right)} \cdot {b}^{2}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      8. associate-*l*N/A

        \[\leadsto \left(b \cdot \left(b \cdot 4\right) + \color{blue}{b \cdot \left(b \cdot {b}^{2}\right)}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      9. distribute-lft-outN/A

        \[\leadsto \color{blue}{b \cdot \left(b \cdot 4 + b \cdot {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      10. distribute-lft-outN/A

        \[\leadsto b \cdot \color{blue}{\left(b \cdot \left(4 + {b}^{2}\right)\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      11. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(b, b \cdot \left(4 + {b}^{2}\right), \mathsf{neg}\left(1\right)\right)} \]
      12. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(b, \color{blue}{b \cdot \left(4 + {b}^{2}\right)}, \mathsf{neg}\left(1\right)\right) \]
      13. +-commutativeN/A

        \[\leadsto \mathsf{fma}\left(b, b \cdot \color{blue}{\left({b}^{2} + 4\right)}, \mathsf{neg}\left(1\right)\right) \]
      14. unpow2N/A

        \[\leadsto \mathsf{fma}\left(b, b \cdot \left(\color{blue}{b \cdot b} + 4\right), \mathsf{neg}\left(1\right)\right) \]
      15. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(b, b \cdot \color{blue}{\mathsf{fma}\left(b, b, 4\right)}, \mathsf{neg}\left(1\right)\right) \]
      16. metadata-eval 99.9

        \[\leadsto \mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \color{blue}{-1}\right) \]
    5. Simplified 99.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), -1\right)} \]

    if 1.2e13 < (*.f64 a a)

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in a around inf

      \[\leadsto \color{blue}{{a}^{4}} \]
    4. Step-by-step derivation
      1. metadata-evalN/A

        \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} \]
      2. pow-sqrN/A

        \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} \]
      3. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} \]
      4. associate-*l*N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
      5. *-lowering-*.f64N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
      6. *-lowering-*.f64N/A

        \[\leadsto a \cdot \color{blue}{\left(a \cdot {a}^{2}\right)} \]
      7. unpow2N/A

        \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
      8. *-lowering-*.f64 94.3

        \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
    5. Simplified 94.3%

      \[\leadsto \color{blue}{a \cdot \left(a \cdot \left(a \cdot a\right)\right)} \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 5: 94.4% accurate, 4.7× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;b \cdot b \leq 10^{+16}:\\ \;\;\;\;\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)\\ \mathbf{else}:\\ \;\;\;\;b \cdot \left(b \cdot \left(b \cdot b\right)\right)\\ \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (if (<= (* b b) 1e+16) (fma a (* a (* a a)) -1.0) (* b (* b (* b b)))))
double code(double a, double b) {
	double tmp;
	if ((b * b) <= 1e+16) {
		tmp = fma(a, (a * (a * a)), -1.0);
	} else {
		tmp = b * (b * (b * b));
	}
	return tmp;
}
function code(a, b)
	tmp = 0.0
	if (Float64(b * b) <= 1e+16)
		tmp = fma(a, Float64(a * Float64(a * a)), -1.0);
	else
		tmp = Float64(b * Float64(b * Float64(b * b)));
	end
	return tmp
end
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 1e+16], N[(a * N[(a * N[(a * a), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision], N[(b * N[(b * N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 10^{+16}:\\
\;\;\;\;\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)\\

\mathbf{else}:\\
\;\;\;\;b \cdot \left(b \cdot \left(b \cdot b\right)\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (*.f64 b b) < 1e16

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in b around 0

      \[\leadsto \color{blue}{{a}^{4} - 1} \]
    4. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{{a}^{4} + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. metadata-evalN/A

        \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} + \left(\mathsf{neg}\left(1\right)\right) \]
      3. pow-sqrN/A

        \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} + \left(\mathsf{neg}\left(1\right)\right) \]
      4. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} + \left(\mathsf{neg}\left(1\right)\right) \]
      5. associate-*l*N/A

        \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot {a}^{2}, \mathsf{neg}\left(1\right)\right)} \]
      7. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(a, \color{blue}{a \cdot {a}^{2}}, \mathsf{neg}\left(1\right)\right) \]
      8. unpow2N/A

        \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
      9. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
      10. metadata-eval 97.7

        \[\leadsto \mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), \color{blue}{-1}\right) \]
    5. Simplified 97.7%

      \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)} \]

    if 1e16 < (*.f64 b b)

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in b around inf

      \[\leadsto \color{blue}{{b}^{4}} \]
    4. Step-by-step derivation
      1. metadata-evalN/A

        \[\leadsto {b}^{\color{blue}{\left(2 \cdot 2\right)}} \]
      2. pow-sqrN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot {b}^{2}} \]
      3. unpow2N/A

        \[\leadsto \color{blue}{\left(b \cdot b\right)} \cdot {b}^{2} \]
      4. associate-*l*N/A

        \[\leadsto \color{blue}{b \cdot \left(b \cdot {b}^{2}\right)} \]
      5. *-lowering-*.f64N/A

        \[\leadsto \color{blue}{b \cdot \left(b \cdot {b}^{2}\right)} \]
      6. *-lowering-*.f64N/A

        \[\leadsto b \cdot \color{blue}{\left(b \cdot {b}^{2}\right)} \]
      7. unpow2N/A

        \[\leadsto b \cdot \left(b \cdot \color{blue}{\left(b \cdot b\right)}\right) \]
      8. *-lowering-*.f64 95.2

        \[\leadsto b \cdot \left(b \cdot \color{blue}{\left(b \cdot b\right)}\right) \]
    5. Simplified 95.2%

      \[\leadsto \color{blue}{b \cdot \left(b \cdot \left(b \cdot b\right)\right)} \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 6: 82.0% accurate, 4.8× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;a \cdot a \leq 12000000000000:\\ \;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\ \mathbf{else}:\\ \;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\ \end{array} \end{array} \]
(FPCore (a b)
 :precision binary64
 (if (<= (* a a) 12000000000000.0) (fma (* b b) 4.0 -1.0) (* a (* a (* a a)))))
double code(double a, double b) {
	double tmp;
	if ((a * a) <= 12000000000000.0) {
		tmp = fma((b * b), 4.0, -1.0);
	} else {
		tmp = a * (a * (a * a));
	}
	return tmp;
}
function code(a, b)
	# Alternative 6: two-regime approximation selected on a*a.
	# At or below the 1.2e13 threshold the result is fma(b*b, 4, -1);
	# above it (or when the comparison fails) the result is a*(a*(a*a)).
	a_sq = Float64(a * a)
	if a_sq <= 12000000000000.0
		return fma(Float64(b * b), 4.0, -1.0)
	end
	return Float64(a * Float64(a * a_sq))
end
(* Alternative 6: if a*a <= 1.2e13 evaluate (b*b)*4 + -1, otherwise a*(a*(a*a)); each intermediate is rounded with N[..., $MachinePrecision]. *)
code[a_, b_] := If[LessEqual[N[(a * a), $MachinePrecision], 12000000000000.0], N[(N[(b * b), $MachinePrecision] * 4.0 + -1.0), $MachinePrecision], N[(a * N[(a * N[(a * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;a \cdot a \leq 12000000000000:\\
\;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\

\mathbf{else}:\\
\;\;\;\;a \cdot \left(a \cdot \left(a \cdot a\right)\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (*.f64 a a) < 1.2e13

    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. associate--l+N/A

        \[\leadsto \color{blue}{{\left(a \cdot a + b \cdot b\right)}^{2} + \left(4 \cdot \left(b \cdot b\right) - 1\right)} \]
      2. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a + b \cdot b\right) \cdot \left(a \cdot a + b \cdot b\right)} + \left(4 \cdot \left(b \cdot b\right) - 1\right) \]
      3. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(a \cdot a + b \cdot b, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right)} \]
      4. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      5. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      7. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), 4 \cdot \left(b \cdot b\right) - 1\right) \]
      8. sub-negN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{4 \cdot \left(b \cdot b\right) + \left(\mathsf{neg}\left(1\right)\right)}\right) \]
      9. associate-*r*N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\left(4 \cdot b\right) \cdot b} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      10. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{b \cdot \left(4 \cdot b\right)} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      11. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(b, 4 \cdot b, \mathsf{neg}\left(1\right)\right)}\right) \]
      12. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      13. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      14. metadata-eval99.9

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, \color{blue}{-1}\right)\right) \]
    4. Applied egg-rr99.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, -1\right)\right)} \]
    5. Taylor expanded in a around 0

      \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1} \]
    6. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. metadata-evalN/A

        \[\leadsto \left(4 \cdot {b}^{2} + {b}^{\color{blue}{\left(2 \cdot 2\right)}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      3. pow-sqrN/A

        \[\leadsto \left(4 \cdot {b}^{2} + \color{blue}{{b}^{2} \cdot {b}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      4. distribute-rgt-inN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot \left(4 + {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      5. metadata-evalN/A

        \[\leadsto {b}^{2} \cdot \left(4 + {b}^{2}\right) + \color{blue}{-1} \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left({b}^{2}, 4 + {b}^{2}, -1\right)} \]
      7. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      8. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      9. +-commutativeN/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{{b}^{2} + 4}, -1\right) \]
      10. unpow2N/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{b \cdot b} + 4, -1\right) \]
      11. accelerator-lowering-fma.f64 100.0

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{\mathsf{fma}\left(b, b, 4\right)}, -1\right) \]
    7. Simplified100.0%

      \[\leadsto \color{blue}{\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)} \]
    8. Taylor expanded in b around 0

      \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{4}, -1\right) \]
    9. Step-by-step derivation
      1. Simplified78.0%

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{4}, -1\right) \]

      if 1.2e13 < (*.f64 a a)

      1. Initial program 99.9%

        \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
      2. Add Preprocessing
      3. Taylor expanded in a around inf

        \[\leadsto \color{blue}{{a}^{4}} \]
      4. Step-by-step derivation
        1. metadata-evalN/A

          \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} \]
        2. pow-sqrN/A

          \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} \]
        3. unpow2N/A

          \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} \]
        4. associate-*l*N/A

          \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
        5. *-lowering-*.f64N/A

          \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} \]
        6. *-lowering-*.f64N/A

          \[\leadsto a \cdot \color{blue}{\left(a \cdot {a}^{2}\right)} \]
        7. unpow2N/A

          \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
        8. *-lowering-*.f64 94.3

          \[\leadsto a \cdot \left(a \cdot \color{blue}{\left(a \cdot a\right)}\right) \]
      5. Simplified94.3%

        \[\leadsto \color{blue}{a \cdot \left(a \cdot \left(a \cdot a\right)\right)} \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

    Alternative 7: 50.7% accurate, 10.9× speedup?

    \[\begin{array}{l} \\ \mathsf{fma}\left(b \cdot b, 4, -1\right) \end{array} \]
    ; Alternative 7: single-expression approximation fma(b*b, 4, -1); the input a is not used.
    (FPCore (a b) :precision binary64 (fma (* b b) 4.0 -1.0))
    double code(double a, double b) {
    	return fma((b * b), 4.0, -1.0);
    }
    
    function code(a, b)
    	# Alternative 7: approximates the expression by fma(b*b, 4, -1).
    	# The argument a is accepted but never read.
    	b_sq = Float64(b * b)
    	return fma(b_sq, 4.0, -1.0)
    end
    
    (* Alternative 7: evaluates (b*b)*4 + -1 at machine precision; the argument a is not used. *)
    code[a_, b_] := N[(N[(b * b), $MachinePrecision] * 4.0 + -1.0), $MachinePrecision]
    
    \begin{array}{l}
    
    \\
    \mathsf{fma}\left(b \cdot b, 4, -1\right)
    \end{array}
    
    Derivation
    1. Initial program 99.9%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. associate--l+N/A

        \[\leadsto \color{blue}{{\left(a \cdot a + b \cdot b\right)}^{2} + \left(4 \cdot \left(b \cdot b\right) - 1\right)} \]
      2. unpow2N/A

        \[\leadsto \color{blue}{\left(a \cdot a + b \cdot b\right) \cdot \left(a \cdot a + b \cdot b\right)} + \left(4 \cdot \left(b \cdot b\right) - 1\right) \]
      3. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(a \cdot a + b \cdot b, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right)} \]
      4. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      5. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), a \cdot a + b \cdot b, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}, 4 \cdot \left(b \cdot b\right) - 1\right) \]
      7. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, \color{blue}{b \cdot b}\right), 4 \cdot \left(b \cdot b\right) - 1\right) \]
      8. sub-negN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{4 \cdot \left(b \cdot b\right) + \left(\mathsf{neg}\left(1\right)\right)}\right) \]
      9. associate-*r*N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\left(4 \cdot b\right) \cdot b} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      10. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{b \cdot \left(4 \cdot b\right)} + \left(\mathsf{neg}\left(1\right)\right)\right) \]
      11. accelerator-lowering-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \color{blue}{\mathsf{fma}\left(b, 4 \cdot b, \mathsf{neg}\left(1\right)\right)}\right) \]
      12. *-commutativeN/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      13. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, \color{blue}{b \cdot 4}, \mathsf{neg}\left(1\right)\right)\right) \]
      14. metadata-eval99.9

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, \color{blue}{-1}\right)\right) \]
    4. Applied egg-rr99.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(\mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(a, a, b \cdot b\right), \mathsf{fma}\left(b, b \cdot 4, -1\right)\right)} \]
    5. Taylor expanded in a around 0

      \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1} \]
    6. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. metadata-evalN/A

        \[\leadsto \left(4 \cdot {b}^{2} + {b}^{\color{blue}{\left(2 \cdot 2\right)}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      3. pow-sqrN/A

        \[\leadsto \left(4 \cdot {b}^{2} + \color{blue}{{b}^{2} \cdot {b}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      4. distribute-rgt-inN/A

        \[\leadsto \color{blue}{{b}^{2} \cdot \left(4 + {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      5. metadata-evalN/A

        \[\leadsto {b}^{2} \cdot \left(4 + {b}^{2}\right) + \color{blue}{-1} \]
      6. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left({b}^{2}, 4 + {b}^{2}, -1\right)} \]
      7. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      8. *-lowering-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, 4 + {b}^{2}, -1\right) \]
      9. +-commutativeN/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{{b}^{2} + 4}, -1\right) \]
      10. unpow2N/A

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{b \cdot b} + 4, -1\right) \]
      11. accelerator-lowering-fma.f64 73.0

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{\mathsf{fma}\left(b, b, 4\right)}, -1\right) \]
    7. Simplified73.0%

      \[\leadsto \color{blue}{\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)} \]
    8. Taylor expanded in b around 0

      \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{4}, -1\right) \]
    9. Step-by-step derivation
      1. Simplified54.1%

        \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{4}, -1\right) \]
    10. Add Preprocessing

      Alternative 8: 24.7% accurate, 131.0× speedup?

      \[\begin{array}{l} \\ -1 \end{array} \]
      ; Alternative 8: constant approximation; evaluates to -1.0 regardless of a and b.
      (FPCore (a b) :precision binary64 -1.0)
      /*
       * Alternative 8: constant approximation of the expression.
       * Both parameters are ignored; the result is always -1.0.
       */
      double code(double a, double b) {
      	return -1.0;
      }
      
      ! Alternative 8: constant approximation of the expression.
      ! Both arguments are declared intent(in) and are never read.
      real(8) function code(a, b)
          real(8), intent (in) :: a
          real(8), intent (in) :: b
          ! The result is always -1 in double precision.
          code = -1.0d0
      end function
      
      /**
       * Alternative 8: constant approximation of the expression.
       *
       * @param a ignored
       * @param b ignored
       * @return always {@code -1.0}
       */
      public static double code(double a, double b) {
      	return -1.0;
      }
      
      def code(a, b):
      	"""Alternative 8: constant approximation; returns -1.0 and ignores both a and b."""
      	return -1.0
      
      # Alternative 8: constant approximation; a and b are ignored.
      function code(a, b)
      	return -1.0
      end
      
      function tmp = code(a, b)
      	% Alternative 8: constant approximation; a and b are ignored and tmp is always -1.0.
      	tmp = -1.0;
      end
      
      (* Alternative 8: constant approximation; evaluates to -1.0 for any a and b. *)
      code[a_, b_] := -1.0
      
      \begin{array}{l}
      
      \\
      -1
      \end{array}
      
      Derivation
      1. Initial program 99.9%

        \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(b \cdot b\right)\right) - 1 \]
      2. Add Preprocessing
      3. Taylor expanded in b around 0

        \[\leadsto \color{blue}{{a}^{4} - 1} \]
      4. Step-by-step derivation
        1. sub-negN/A

          \[\leadsto \color{blue}{{a}^{4} + \left(\mathsf{neg}\left(1\right)\right)} \]
        2. metadata-evalN/A

          \[\leadsto {a}^{\color{blue}{\left(2 \cdot 2\right)}} + \left(\mathsf{neg}\left(1\right)\right) \]
        3. pow-sqrN/A

          \[\leadsto \color{blue}{{a}^{2} \cdot {a}^{2}} + \left(\mathsf{neg}\left(1\right)\right) \]
        4. unpow2N/A

          \[\leadsto \color{blue}{\left(a \cdot a\right)} \cdot {a}^{2} + \left(\mathsf{neg}\left(1\right)\right) \]
        5. associate-*l*N/A

          \[\leadsto \color{blue}{a \cdot \left(a \cdot {a}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
        6. accelerator-lowering-fma.f64N/A

          \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot {a}^{2}, \mathsf{neg}\left(1\right)\right)} \]
        7. *-lowering-*.f64N/A

          \[\leadsto \mathsf{fma}\left(a, \color{blue}{a \cdot {a}^{2}}, \mathsf{neg}\left(1\right)\right) \]
        8. unpow2N/A

          \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
        9. *-lowering-*.f64N/A

          \[\leadsto \mathsf{fma}\left(a, a \cdot \color{blue}{\left(a \cdot a\right)}, \mathsf{neg}\left(1\right)\right) \]
        10. metadata-eval70.3

          \[\leadsto \mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), \color{blue}{-1}\right) \]
      5. Simplified70.3%

        \[\leadsto \color{blue}{\mathsf{fma}\left(a, a \cdot \left(a \cdot a\right), -1\right)} \]
      6. Taylor expanded in a around 0

        \[\leadsto \color{blue}{-1} \]
      7. Step-by-step derivation
        1. Simplified27.4%

          \[\leadsto \color{blue}{-1} \]
      8. Add Preprocessing

        Reproduce

        ?
        herbie shell --seed 2024198 
        (FPCore (a b)
          :name "Bouland and Aaronson, Equation (26)"
          :precision binary64
          (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (* b b))) 1.0))