Bouland and Aaronson, Equation (25)

Percentage Accurate: 74.6% → 98.9%
Time: 10.6s
Alternatives: 10
Speedup: 5.7×

Specification

?
\[\begin{array}{l} \\ \left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \end{array} \]
; Specification: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
; Inputs are the two variables a and b; evaluation is in binary64.
(FPCore (a b)
 :precision binary64
 (-
  (+
   ; squared sum of squares
   (pow (+ (* a a) (* b b)) 2.0)
   ; 4 * (a^2 * (1 + a) + b^2 * (1 - 3a))
   (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a))))))
  1.0))
/*
 * C rendering of the specification:
 *   ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
 * a, b: double inputs. Returns the expression value as a double.
 * The expression is kept as one parenthesised statement so the operation
 * order matches the FPCore form exactly.
 */
double code(double a, double b) {
	return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
! Fortran rendering of the specification:
!   ((a*a + b*b)**2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
! a, b: real(8) inputs (intent in). The function result is real(8).
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    ! Single parenthesised expression; all literals are double precision (d0).
    code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 + a)) + ((b * b) * (1.0d0 - (3.0d0 * a)))))) - 1.0d0
end function
/**
 * Evaluates ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
 *
 * @param a first input
 * @param b second input
 * @return the value of the expression in double arithmetic
 */
public static double code(double a, double b) {
	final double aSquared = a * a;
	final double bSquared = b * b;
	// (a^2 + b^2)^2, still computed through Math.pow with exponent 2.0.
	final double squaredSum = Math.pow(aSquared + bSquared, 2.0);
	final double aPart = aSquared * (1.0 + a);
	final double bPart = bSquared * (1.0 - (3.0 * a));
	return (squaredSum + (4.0 * (aPart + bPart))) - 1.0;
}
def code(a, b):
	"""Evaluate ((a*a + b*b)**2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.

	Args:
		a: first input (float).
		b: second input (float).

	Returns:
		The value of the expression as a float. When the squared term
		overflows the float range, it is taken as +inf instead of raising.
	"""
	sum_sq = (a * a) + (b * b)
	try:
		squared = math.pow(sum_sq, 2.0)
	except OverflowError:
		# math.pow raises on overflow, while float + and * saturate silently.
		# sum_sq is a sum of squares, so the overflowed square is +inf.
		squared = float("inf")
	return (squared + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
# Evaluate ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
# Every intermediate result is passed through Float64, as in the one-line form.
function code(a, b)
	a_sq = Float64(a * a)
	b_sq = Float64(b * b)
	squared_sum = Float64(a_sq + b_sq) ^ 2.0
	a_part = Float64(a_sq * Float64(1.0 + a))
	b_part = Float64(b_sq * Float64(1.0 - Float64(3.0 * a)))
	scaled = Float64(4.0 * Float64(a_part + b_part))
	return Float64(Float64(squared_sum + scaled) - 1.0)
end
function tmp = code(a, b)
	% CODE Evaluate ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
	%   tmp = code(a, b) returns the value of the expression for inputs a and b.
	aSq = a * a;
	bSq = b * b;
	squaredSum = (aSq + bSq) ^ 2.0;
	weighted = (aSq * (1.0 + a)) + (bSq * (1.0 - (3.0 * a)));
	tmp = (squaredSum + (4.0 * weighted)) - 1.0;
end
(* Mathematica rendering of ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1. *)
(* Each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}

\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. The horizontal axis shows the value of an input variable; the variable is chosen in the title. The vertical axis is accuracy; higher is better. Red represents the original program, while blue represents Herbie's suggestion. These can be toggled with the buttons below the plot. The line is an average, while dots represent individual samples.

Accuracy vs Speed?

Herbie found 10 alternatives:

Alternative | Accuracy | Speedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternative. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative. The line shows the best available speed-accuracy tradeoffs.

Initial Program: 74.6% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \end{array} \]
; Initial program: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
; Inputs are the two variables a and b; evaluation is in binary64.
(FPCore (a b)
 :precision binary64
 (-
  (+
   ; squared sum of squares
   (pow (+ (* a a) (* b b)) 2.0)
   ; 4 * (a^2 * (1 + a) + b^2 * (1 - 3a))
   (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a))))))
  1.0))
/*
 * C rendering of the initial program:
 *   ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
 * a, b: double inputs. Returns the expression value as a double.
 * The expression is kept as one parenthesised statement so the operation
 * order matches the FPCore form exactly.
 */
double code(double a, double b) {
	return (pow(((a * a) + (b * b)), 2.0) + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0;
}
! Fortran rendering of the initial program:
!   ((a*a + b*b)**2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
! a, b: real(8) inputs (intent in). The function result is real(8).
real(8) function code(a, b)
    real(8), intent (in) :: a
    real(8), intent (in) :: b
    ! Single parenthesised expression; all literals are double precision (d0).
    code = ((((a * a) + (b * b)) ** 2.0d0) + (4.0d0 * (((a * a) * (1.0d0 + a)) + ((b * b) * (1.0d0 - (3.0d0 * a)))))) - 1.0d0
end function
/**
 * Initial program: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
 *
 * @param a first input
 * @param b second input
 * @return the value of the expression in double arithmetic
 */
public static double code(double a, double b) {
	final double aa = a * a;
	final double bb = b * b;
	// Square of the sum of squares, via Math.pow with exponent 2.0.
	final double quartic = Math.pow(aa + bb, 2.0);
	final double inner = (aa * (1.0 + a)) + (bb * (1.0 - (3.0 * a)));
	final double scaled = 4.0 * inner;
	return (quartic + scaled) - 1.0;
}
def code(a, b):
	"""Initial program: ((a*a + b*b)**2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.

	Args:
		a: first input (float).
		b: second input (float).

	Returns:
		The value of the expression as a float. When the squared term
		overflows the float range, it is taken as +inf instead of raising.
	"""
	sum_sq = (a * a) + (b * b)
	try:
		squared = math.pow(sum_sq, 2.0)
	except OverflowError:
		# math.pow raises on overflow, while float + and * saturate silently.
		# sum_sq is a sum of squares, so the overflowed square is +inf.
		squared = float("inf")
	return (squared + (4.0 * (((a * a) * (1.0 + a)) + ((b * b) * (1.0 - (3.0 * a)))))) - 1.0
# Initial program: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
# Every intermediate result is passed through Float64, as in the one-line form.
function code(a, b)
	aa = Float64(a * a)
	bb = Float64(b * b)
	quartic = Float64(aa + bb) ^ 2.0
	inner = Float64(Float64(aa * Float64(1.0 + a)) + Float64(bb * Float64(1.0 - Float64(3.0 * a))))
	total = Float64(quartic + Float64(4.0 * inner))
	return Float64(total - 1.0)
end
function tmp = code(a, b)
	% CODE Initial program: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1.
	%   tmp = code(a, b) returns the value of the expression for inputs a and b.
	aa = a * a;
	bb = b * b;
	quartic = (aa + bb) ^ 2.0;
	inner = (aa * (1.0 + a)) + (bb * (1.0 - (3.0 * a)));
	tmp = (quartic + (4.0 * inner)) - 1.0;
end
(* Initial program: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1. *)
(* Each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := N[(N[(N[Power[N[(N[(a * a), $MachinePrecision] + N[(b * b), $MachinePrecision]), $MachinePrecision], 2.0], $MachinePrecision] + N[(4.0 * N[(N[(N[(a * a), $MachinePrecision] * N[(1.0 + a), $MachinePrecision]), $MachinePrecision] + N[(N[(b * b), $MachinePrecision] * N[(1.0 - N[(3.0 * a), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] - 1.0), $MachinePrecision]
\begin{array}{l}

\\
\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1
\end{array}

Alternative 1: 98.9% accurate, 2.6× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \mathsf{fma}\left(a, a, b \cdot b\right)\\ \left(\frac{t\_0}{\frac{1}{t\_0}} + 4 \cdot \left(b \cdot b\right)\right) + -1 \end{array} \end{array} \]
; Alternative 1: (t_0 / (1 / t_0) + 4*(b*b)) + -1, with t_0 = fma(a, a, b*b).
(FPCore (a b)
 :precision binary64
 ; t_0 is the fused a*a + b*b
 (let* ((t_0 (fma a a (* b b))))
   ; t_0 / (1 / t_0) stands in for the squared sum; only the 4*b*b term is added
   (+ (+ (/ t_0 (/ 1.0 t_0)) (* 4.0 (* b b))) -1.0)))
double code(double a, double b) {
	double t_0 = fma(a, a, (b * b));
	return ((t_0 / (1.0 / t_0)) + (4.0 * (b * b))) + -1.0;
}
# Alternative 1: (s / (1 / s) + 4*(b*b)) + -1, where s = fma(a, a, b*b).
function code(a, b)
	sum_sq = fma(a, a, Float64(b * b))
	quartic = Float64(sum_sq / Float64(1.0 / sum_sq))
	b_term = Float64(4.0 * Float64(b * b))
	return Float64(Float64(quartic + b_term) + -1.0)
end
(* Alternative 1: (t0 / (1 / t0) + 4*(b*b)) + -1, where the Block-local t$95$0 holds a*a + b*b. *)
(* Each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := Block[{t$95$0 = N[(a * a + N[(b * b), $MachinePrecision]), $MachinePrecision]}, N[(N[(N[(t$95$0 / N[(1.0 / t$95$0), $MachinePrecision]), $MachinePrecision] + N[(4.0 * N[(b * b), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]]
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \mathsf{fma}\left(a, a, b \cdot b\right)\\
\left(\frac{t\_0}{\frac{1}{t\_0}} + 4 \cdot \left(b \cdot b\right)\right) + -1
\end{array}
\end{array}
Derivation
  1. Initial program 74.1%

    \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
  2. Add Preprocessing
  3. Step-by-step derivation
    1. lift-pow.f64N/A

      \[\leadsto \left(\color{blue}{{\left(a \cdot a + b \cdot b\right)}^{2}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    2. unpow2N/A

      \[\leadsto \left(\color{blue}{\left(a \cdot a + b \cdot b\right) \cdot \left(a \cdot a + b \cdot b\right)} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    3. lift-+.f64N/A

      \[\leadsto \left(\left(a \cdot a + b \cdot b\right) \cdot \color{blue}{\left(a \cdot a + b \cdot b\right)} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    4. flip-+N/A

      \[\leadsto \left(\left(a \cdot a + b \cdot b\right) \cdot \color{blue}{\frac{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}{a \cdot a - b \cdot b}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    5. clear-numN/A

      \[\leadsto \left(\left(a \cdot a + b \cdot b\right) \cdot \color{blue}{\frac{1}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    6. un-div-invN/A

      \[\leadsto \left(\color{blue}{\frac{a \cdot a + b \cdot b}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    7. lower-/.f64N/A

      \[\leadsto \left(\color{blue}{\frac{a \cdot a + b \cdot b}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    8. lift-+.f64N/A

      \[\leadsto \left(\frac{\color{blue}{a \cdot a + b \cdot b}}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    9. lift-*.f64N/A

      \[\leadsto \left(\frac{\color{blue}{a \cdot a} + b \cdot b}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    10. lower-fma.f64N/A

      \[\leadsto \left(\frac{\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}}{\frac{a \cdot a - b \cdot b}{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    11. clear-numN/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\color{blue}{\frac{1}{\frac{\left(a \cdot a\right) \cdot \left(a \cdot a\right) - \left(b \cdot b\right) \cdot \left(b \cdot b\right)}{a \cdot a - b \cdot b}}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    12. flip-+N/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\color{blue}{a \cdot a + b \cdot b}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    13. lift-+.f64N/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\color{blue}{a \cdot a + b \cdot b}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    14. lower-/.f6474.1

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\color{blue}{\frac{1}{a \cdot a + b \cdot b}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    15. lift-+.f64N/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\color{blue}{a \cdot a + b \cdot b}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    16. lift-*.f64N/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\color{blue}{a \cdot a} + b \cdot b}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    17. lower-fma.f6474.1

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\color{blue}{\mathsf{fma}\left(a, a, b \cdot b\right)}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
  4. Applied rewrites74.1%

    \[\leadsto \left(\color{blue}{\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}}} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
  5. Taylor expanded in a around 0

    \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}} + 4 \cdot \color{blue}{{b}^{2}}\right) - 1 \]
  6. Step-by-step derivation
    1. unpow2N/A

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}} + 4 \cdot \color{blue}{\left(b \cdot b\right)}\right) - 1 \]
    2. lower-*.f6499.5

      \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}} + 4 \cdot \color{blue}{\left(b \cdot b\right)}\right) - 1 \]
  7. Applied rewrites99.5%

    \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}} + 4 \cdot \color{blue}{\left(b \cdot b\right)}\right) - 1 \]
  8. Final simplification99.5%

    \[\leadsto \left(\frac{\mathsf{fma}\left(a, a, b \cdot b\right)}{\frac{1}{\mathsf{fma}\left(a, a, b \cdot b\right)}} + 4 \cdot \left(b \cdot b\right)\right) + -1 \]
  9. Add Preprocessing

Alternative 2: 97.8% accurate, 2.4× speedup?

\[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;b \cdot b \leq 5:\\ \;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(a, a + 4, 4\right), a \cdot a, -1\right)\\ \mathbf{elif}\;b \cdot b \leq 5 \cdot 10^{+302}:\\ \;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \mathsf{fma}\left(a, \mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(2, a, -12\right), a \cdot 4\right), -1\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\ \end{array} \end{array} \]
; Alternative 2: three regimes selected by the value of b*b.
(FPCore (a b)
 :precision binary64
 ; Regime 1 (b*b <= 5): expression in a only, fma(fma(a, a + 4, 4), a*a, -1).
 (if (<= (* b b) 5.0)
   (fma (fma a (+ a 4.0) 4.0) (* a a) -1.0)
   ; Regime 2 (5 < b*b <= 5e302): b*(b*(b*b + 4)) + (a*(b*b*(2a - 12) + 4a) - 1).
   (if (<= (* b b) 5e+302)
     (fma
      b
      (* b (fma b b 4.0))
      (fma a (fma (* b b) (fma 2.0 a -12.0) (* a 4.0)) -1.0))
     ; Regime 3 (otherwise): 4*(b*b) - 1.
     (fma (* b b) 4.0 -1.0))))
double code(double a, double b) {
	double tmp;
	if ((b * b) <= 5.0) {
		tmp = fma(fma(a, (a + 4.0), 4.0), (a * a), -1.0);
	} else if ((b * b) <= 5e+302) {
		tmp = fma(b, (b * fma(b, b, 4.0)), fma(a, fma((b * b), fma(2.0, a, -12.0), (a * 4.0)), -1.0));
	} else {
		tmp = fma((b * b), 4.0, -1.0);
	}
	return tmp;
}
# Alternative 2: piecewise form selected by the value of b*b.
function code(a, b)
	# Regime 1: b*b <= 5, expression in a only.
	if Float64(b * b) <= 5.0
		return fma(fma(a, Float64(a + 4.0), 4.0), Float64(a * a), -1.0)
	end
	# Regime 2: 5 < b*b <= 5e302.
	if Float64(b * b) <= 5e+302
		return fma(b, Float64(b * fma(b, b, 4.0)), fma(a, fma(Float64(b * b), fma(2.0, a, -12.0), Float64(a * 4.0)), -1.0))
	end
	# Regime 3: everything else.
	return fma(Float64(b * b), 4.0, -1.0)
end
(* Alternative 2: nested If selecting one of three expressions by the value of b*b (thresholds 5.0 and 5e+302). *)
(* Each intermediate result is wrapped in N[..., $MachinePrecision]. *)
code[a_, b_] := If[LessEqual[N[(b * b), $MachinePrecision], 5.0], N[(N[(a * N[(a + 4.0), $MachinePrecision] + 4.0), $MachinePrecision] * N[(a * a), $MachinePrecision] + -1.0), $MachinePrecision], If[LessEqual[N[(b * b), $MachinePrecision], 5e+302], N[(b * N[(b * N[(b * b + 4.0), $MachinePrecision]), $MachinePrecision] + N[(a * N[(N[(b * b), $MachinePrecision] * N[(2.0 * a + -12.0), $MachinePrecision] + N[(a * 4.0), $MachinePrecision]), $MachinePrecision] + -1.0), $MachinePrecision]), $MachinePrecision], N[(N[(b * b), $MachinePrecision] * 4.0 + -1.0), $MachinePrecision]]]
\begin{array}{l}

\\
\begin{array}{l}
\mathbf{if}\;b \cdot b \leq 5:\\
\;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(a, a + 4, 4\right), a \cdot a, -1\right)\\

\mathbf{elif}\;b \cdot b \leq 5 \cdot 10^{+302}:\\
\;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \mathsf{fma}\left(a, \mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(2, a, -12\right), a \cdot 4\right), -1\right)\right)\\

\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 3 regimes
  2. if (*.f64 b b) < 5

    1. Initial program 83.7%

      \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
    2. Add Preprocessing
    3. Taylor expanded in b around 0

      \[\leadsto \color{blue}{\left(4 \cdot \left({a}^{2} \cdot \left(1 + a\right)\right) + {a}^{4}\right) - 1} \]
    4. Step-by-step derivation
      1. sub-negN/A

        \[\leadsto \color{blue}{\left(4 \cdot \left({a}^{2} \cdot \left(1 + a\right)\right) + {a}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
      2. +-commutativeN/A

        \[\leadsto \color{blue}{\left({a}^{4} + 4 \cdot \left({a}^{2} \cdot \left(1 + a\right)\right)\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      3. metadata-evalN/A

        \[\leadsto \left({a}^{\color{blue}{\left(2 \cdot 2\right)}} + 4 \cdot \left({a}^{2} \cdot \left(1 + a\right)\right)\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      4. pow-sqrN/A

        \[\leadsto \left(\color{blue}{{a}^{2} \cdot {a}^{2}} + 4 \cdot \left({a}^{2} \cdot \left(1 + a\right)\right)\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      5. *-commutativeN/A

        \[\leadsto \left({a}^{2} \cdot {a}^{2} + 4 \cdot \color{blue}{\left(\left(1 + a\right) \cdot {a}^{2}\right)}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      6. associate-*r*N/A

        \[\leadsto \left({a}^{2} \cdot {a}^{2} + \color{blue}{\left(4 \cdot \left(1 + a\right)\right) \cdot {a}^{2}}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
      7. distribute-rgt-outN/A

        \[\leadsto \color{blue}{{a}^{2} \cdot \left({a}^{2} + 4 \cdot \left(1 + a\right)\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
      8. metadata-evalN/A

        \[\leadsto {a}^{2} \cdot \left({a}^{2} + 4 \cdot \left(1 + a\right)\right) + \color{blue}{-1} \]
      9. lower-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left({a}^{2}, {a}^{2} + 4 \cdot \left(1 + a\right), -1\right)} \]
      10. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{a \cdot a}, {a}^{2} + 4 \cdot \left(1 + a\right), -1\right) \]
      11. lower-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{a \cdot a}, {a}^{2} + 4 \cdot \left(1 + a\right), -1\right) \]
      12. unpow2N/A

        \[\leadsto \mathsf{fma}\left(a \cdot a, \color{blue}{a \cdot a} + 4 \cdot \left(1 + a\right), -1\right) \]
      13. lower-fma.f64N/A

        \[\leadsto \mathsf{fma}\left(a \cdot a, \color{blue}{\mathsf{fma}\left(a, a, 4 \cdot \left(1 + a\right)\right)}, -1\right) \]
      14. +-commutativeN/A

        \[\leadsto \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, 4 \cdot \color{blue}{\left(a + 1\right)}\right), -1\right) \]
      15. distribute-lft-inN/A

        \[\leadsto \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, \color{blue}{4 \cdot a + 4 \cdot 1}\right), -1\right) \]
      16. metadata-evalN/A

        \[\leadsto \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, 4 \cdot a + \color{blue}{4}\right), -1\right) \]
      17. lower-fma.f6499.3

        \[\leadsto \mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, \color{blue}{\mathsf{fma}\left(4, a, 4\right)}\right), -1\right) \]
    5. Applied rewrites99.3%

      \[\leadsto \color{blue}{\mathsf{fma}\left(a \cdot a, \mathsf{fma}\left(a, a, \mathsf{fma}\left(4, a, 4\right)\right), -1\right)} \]
    6. Step-by-step derivation
      1. Applied rewrites99.4%

        \[\leadsto \mathsf{fma}\left(\mathsf{fma}\left(a, a + 4, 4\right), \color{blue}{a \cdot a}, -1\right) \]

      if 5 < (*.f64 b b) < 5e302

      1. Initial program 70.9%

        \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
      2. Add Preprocessing
      3. Taylor expanded in a around 0

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) + {b}^{4}\right)\right) - 1} \]
      4. Step-by-step derivation
        1. +-commutativeN/A

          \[\leadsto \left(4 \cdot {b}^{2} + \color{blue}{\left({b}^{4} + a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right)\right)}\right) - 1 \]
        2. associate-+r+N/A

          \[\leadsto \color{blue}{\left(\left(4 \cdot {b}^{2} + {b}^{4}\right) + a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right)\right)} - 1 \]
        3. associate--l+N/A

          \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right)} \]
        4. +-commutativeN/A

          \[\leadsto \color{blue}{\left({b}^{4} + 4 \cdot {b}^{2}\right)} + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        5. metadata-evalN/A

          \[\leadsto \left({b}^{\color{blue}{\left(3 + 1\right)}} + 4 \cdot {b}^{2}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        6. pow-plusN/A

          \[\leadsto \left(\color{blue}{{b}^{3} \cdot b} + 4 \cdot {b}^{2}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        7. cube-unmultN/A

          \[\leadsto \left(\color{blue}{\left(b \cdot \left(b \cdot b\right)\right)} \cdot b + 4 \cdot {b}^{2}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        8. unpow2N/A

          \[\leadsto \left(\left(b \cdot \color{blue}{{b}^{2}}\right) \cdot b + 4 \cdot {b}^{2}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        9. unpow2N/A

          \[\leadsto \left(\left(b \cdot {b}^{2}\right) \cdot b + 4 \cdot \color{blue}{\left(b \cdot b\right)}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        10. associate-*r*N/A

          \[\leadsto \left(\left(b \cdot {b}^{2}\right) \cdot b + \color{blue}{\left(4 \cdot b\right) \cdot b}\right) + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        11. distribute-rgt-outN/A

          \[\leadsto \color{blue}{b \cdot \left(b \cdot {b}^{2} + 4 \cdot b\right)} + \left(a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right) \]
        12. lower-fma.f64N/A

          \[\leadsto \color{blue}{\mathsf{fma}\left(b, b \cdot {b}^{2} + 4 \cdot b, a \cdot \left(-12 \cdot {b}^{2} + a \cdot \left(4 + 2 \cdot {b}^{2}\right)\right) - 1\right)} \]
      5. Applied rewrites93.7%

        \[\leadsto \color{blue}{\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \mathsf{fma}\left(a, \mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(2, a, -12\right), 4 \cdot a\right), -1\right)\right)} \]

      if 5e302 < (*.f64 b b)

      1. Initial program 60.0%

        \[\left({\left(a \cdot a + b \cdot b\right)}^{2} + 4 \cdot \left(\left(a \cdot a\right) \cdot \left(1 + a\right) + \left(b \cdot b\right) \cdot \left(1 - 3 \cdot a\right)\right)\right) - 1 \]
      2. Add Preprocessing
      3. Taylor expanded in a around 0

        \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) - 1} \]
      4. Step-by-step derivation
        1. sub-negN/A

          \[\leadsto \color{blue}{\left(4 \cdot {b}^{2} + {b}^{4}\right) + \left(\mathsf{neg}\left(1\right)\right)} \]
        2. +-commutativeN/A

          \[\leadsto \color{blue}{\left({b}^{4} + 4 \cdot {b}^{2}\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
        3. metadata-evalN/A

          \[\leadsto \left({b}^{\color{blue}{\left(2 \cdot 2\right)}} + 4 \cdot {b}^{2}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
        4. pow-sqrN/A

          \[\leadsto \left(\color{blue}{{b}^{2} \cdot {b}^{2}} + 4 \cdot {b}^{2}\right) + \left(\mathsf{neg}\left(1\right)\right) \]
        5. distribute-rgt-outN/A

          \[\leadsto \color{blue}{{b}^{2} \cdot \left({b}^{2} + 4\right)} + \left(\mathsf{neg}\left(1\right)\right) \]
        6. metadata-evalN/A

          \[\leadsto {b}^{2} \cdot \left({b}^{2} + 4\right) + \color{blue}{-1} \]
        7. lower-fma.f64N/A

          \[\leadsto \color{blue}{\mathsf{fma}\left({b}^{2}, {b}^{2} + 4, -1\right)} \]
        8. unpow2N/A

          \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, {b}^{2} + 4, -1\right) \]
        9. lower-*.f64N/A

          \[\leadsto \mathsf{fma}\left(\color{blue}{b \cdot b}, {b}^{2} + 4, -1\right) \]
        10. unpow2N/A

          \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{b \cdot b} + 4, -1\right) \]
        11. lower-fma.f64100.0

          \[\leadsto \mathsf{fma}\left(b \cdot b, \color{blue}{\mathsf{fma}\left(b, b, 4\right)}, -1\right) \]
      5. Applied rewrites100.0%

        \[\leadsto \color{blue}{\mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(b, b, 4\right), -1\right)} \]
      6. Taylor expanded in b around 0

        \[\leadsto \mathsf{fma}\left(b \cdot b, 4, -1\right) \]
      7. Step-by-step derivation
        1. Applied rewrites98.6%

          \[\leadsto \mathsf{fma}\left(b \cdot b, 4, -1\right) \]
      8. Recombined 3 regimes into one program.
      9. Final simplification97.8%

        \[\leadsto \begin{array}{l} \mathbf{if}\;b \cdot b \leq 5:\\ \;\;\;\;\mathsf{fma}\left(\mathsf{fma}\left(a, a + 4, 4\right), a \cdot a, -1\right)\\ \mathbf{elif}\;b \cdot b \leq 5 \cdot 10^{+302}:\\ \;\;\;\;\mathsf{fma}\left(b, b \cdot \mathsf{fma}\left(b, b, 4\right), \mathsf{fma}\left(a, \mathsf{fma}\left(b \cdot b, \mathsf{fma}\left(2, a, -12\right), a \cdot 4\right), -1\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(b \cdot b, 4, -1\right)\\ \end{array} \]
      10. Add Preprocessing

      Reproduce

      ?
      herbie shell --seed 2024229 
      ; Input expression for the run: ((a*a + b*b)^2 + 4*((a*a)*(1 + a) + (b*b)*(1 - 3*a))) - 1
      (FPCore (a b)
        :name "Bouland and Aaronson, Equation (25)"
        :precision binary64
        (- (+ (pow (+ (* a a) (* b b)) 2.0) (* 4.0 (+ (* (* a a) (+ 1.0 a)) (* (* b b) (- 1.0 (* 3.0 a)))))) 1.0))