bug333 (missed optimization)

Percentage Accurate: 8.4% → 99.8%
Time: 5.2s
Alternatives: 5
Speedup: 207.0×

Specification

?
\[-1 \leq x \land x \leq 1\]
\[\begin{array}{l} \\ \sqrt{1 + x} - \sqrt{1 - x} \end{array} \]
(FPCore (x) :precision binary64 (- (sqrt (+ 1.0 x)) (sqrt (- 1.0 x))))
double code(double x) {
	return sqrt((1.0 + x)) - sqrt((1.0 - x));
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = sqrt((1.0d0 + x)) - sqrt((1.0d0 - x))
end function
public static double code(double x) {
	return Math.sqrt((1.0 + x)) - Math.sqrt((1.0 - x));
}
def code(x):
	return math.sqrt((1.0 + x)) - math.sqrt((1.0 - x))
function code(x)
	return Float64(sqrt(Float64(1.0 + x)) - sqrt(Float64(1.0 - x)))
end
function tmp = code(x)
	tmp = sqrt((1.0 + x)) - sqrt((1.0 - x));
end
code[x_] := N[(N[Sqrt[N[(1.0 + x), $MachinePrecision]], $MachinePrecision] - N[Sqrt[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
\sqrt{1 + x} - \sqrt{1 - x}
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 5 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 8.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \sqrt{1 + x} - \sqrt{1 - x} \end{array} \]
(FPCore (x) :precision binary64 (- (sqrt (+ 1.0 x)) (sqrt (- 1.0 x))))
double code(double x) {
	return sqrt((1.0 + x)) - sqrt((1.0 - x));
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = sqrt((1.0d0 + x)) - sqrt((1.0d0 - x))
end function
public static double code(double x) {
	return Math.sqrt((1.0 + x)) - Math.sqrt((1.0 - x));
}
def code(x):
	return math.sqrt((1.0 + x)) - math.sqrt((1.0 - x))
function code(x)
	return Float64(sqrt(Float64(1.0 + x)) - sqrt(Float64(1.0 - x)))
end
function tmp = code(x)
	tmp = sqrt((1.0 + x)) - sqrt((1.0 - x));
end
code[x_] := N[(N[Sqrt[N[(1.0 + x), $MachinePrecision]], $MachinePrecision] - N[Sqrt[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
\sqrt{1 + x} - \sqrt{1 - x}
\end{array}

Alternative 1: 99.8% accurate, 9.9× speedup?

\[\begin{array}{l} \\ x + x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right) \end{array} \]
(FPCore (x)
 :precision binary64
 (+
  x
  (*
   x
   (* (* x x) (+ 0.125 (* x (* x (+ 0.0546875 (* (* x x) 0.0322265625)))))))))
double code(double x) {
	return x + (x * ((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))));
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = x + (x * ((x * x) * (0.125d0 + (x * (x * (0.0546875d0 + ((x * x) * 0.0322265625d0)))))))
end function
public static double code(double x) {
	return x + (x * ((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))));
}
def code(x):
	return x + (x * ((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))))
function code(x)
	return Float64(x + Float64(x * Float64(Float64(x * x) * Float64(0.125 + Float64(x * Float64(x * Float64(0.0546875 + Float64(Float64(x * x) * 0.0322265625))))))))
end
function tmp = code(x)
	tmp = x + (x * ((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))));
end
code[x_] := N[(x + N[(x * N[(N[(x * x), $MachinePrecision] * N[(0.125 + N[(x * N[(x * N[(0.0546875 + N[(N[(x * x), $MachinePrecision] * 0.0322265625), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
x + x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right)
\end{array}
Derivation
  1. Initial program 7.3%

    \[\sqrt{1 + x} - \sqrt{1 - x} \]
  2. Add Preprocessing
  3. Taylor expanded in x around 0

    \[\leadsto \color{blue}{x \cdot \left(1 + {x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)} \]
  4. Step-by-step derivation
    1. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \color{blue}{\left(1 + {x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)}\right) \]
    2. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \color{blue}{\left({x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)}\right)\right) \]
    3. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right) \]
    4. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left(x \cdot x\right), \left(\color{blue}{\frac{1}{8}} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right) \]
    5. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \left(\color{blue}{\frac{1}{8}} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right) \]
    6. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \color{blue}{\left({x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right) \]
    7. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \left(\left(x \cdot x\right) \cdot \left(\color{blue}{\frac{7}{128}} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right)\right) \]
    8. associate-*l*N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \left(x \cdot \color{blue}{\left(x \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right)\right) \]
    9. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \color{blue}{\left(x \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right)\right) \]
    10. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \color{blue}{\left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)}\right)\right)\right)\right)\right)\right) \]
    11. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \color{blue}{\left(\frac{33}{1024} \cdot {x}^{2}\right)}\right)\right)\right)\right)\right)\right)\right) \]
    12. *-commutativeN/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \left({x}^{2} \cdot \color{blue}{\frac{33}{1024}}\right)\right)\right)\right)\right)\right)\right)\right) \]
    13. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\frac{33}{1024}}\right)\right)\right)\right)\right)\right)\right)\right) \]
    14. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\left(x \cdot x\right), \frac{33}{1024}\right)\right)\right)\right)\right)\right)\right)\right) \]
    15. *-lowering-*.f64100.0%

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \frac{33}{1024}\right)\right)\right)\right)\right)\right)\right)\right) \]
  5. Simplified100.0%

    \[\leadsto \color{blue}{x \cdot \left(1 + \left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right)} \]
  6. Step-by-step derivation
    1. +-commutativeN/A

      \[\leadsto x \cdot \left(\left(x \cdot x\right) \cdot \left(\frac{1}{8} + x \cdot \left(x \cdot \left(\frac{7}{128} + \left(x \cdot x\right) \cdot \frac{33}{1024}\right)\right)\right) + \color{blue}{1}\right) \]
    2. distribute-rgt-inN/A

      \[\leadsto \left(\left(x \cdot x\right) \cdot \left(\frac{1}{8} + x \cdot \left(x \cdot \left(\frac{7}{128} + \left(x \cdot x\right) \cdot \frac{33}{1024}\right)\right)\right)\right) \cdot x + \color{blue}{1 \cdot x} \]
    3. *-lft-identityN/A

      \[\leadsto \left(\left(x \cdot x\right) \cdot \left(\frac{1}{8} + x \cdot \left(x \cdot \left(\frac{7}{128} + \left(x \cdot x\right) \cdot \frac{33}{1024}\right)\right)\right)\right) \cdot x + x \]
    4. +-lowering-+.f64N/A

      \[\leadsto \mathsf{+.f64}\left(\left(\left(\left(x \cdot x\right) \cdot \left(\frac{1}{8} + x \cdot \left(x \cdot \left(\frac{7}{128} + \left(x \cdot x\right) \cdot \frac{33}{1024}\right)\right)\right)\right) \cdot x\right), \color{blue}{x}\right) \]
  7. Applied egg-rr100.0%

    \[\leadsto \color{blue}{x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right) + x} \]
  8. Final simplification100.0%

    \[\leadsto x + x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right) \]
  9. Add Preprocessing

Alternative 2: 99.8% accurate, 9.9× speedup?

\[\begin{array}{l} \\ x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right) + 1\right) \end{array} \]
(FPCore (x)
 :precision binary64
 (*
  x
  (+
   (* (* x x) (+ 0.125 (* x (* x (+ 0.0546875 (* (* x x) 0.0322265625))))))
   1.0)))
double code(double x) {
	return x * (((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))) + 1.0);
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = x * (((x * x) * (0.125d0 + (x * (x * (0.0546875d0 + ((x * x) * 0.0322265625d0)))))) + 1.0d0)
end function
public static double code(double x) {
	return x * (((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))) + 1.0);
}
def code(x):
	return x * (((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))) + 1.0)
function code(x)
	return Float64(x * Float64(Float64(Float64(x * x) * Float64(0.125 + Float64(x * Float64(x * Float64(0.0546875 + Float64(Float64(x * x) * 0.0322265625)))))) + 1.0))
end
function tmp = code(x)
	tmp = x * (((x * x) * (0.125 + (x * (x * (0.0546875 + ((x * x) * 0.0322265625)))))) + 1.0);
end
code[x_] := N[(x * N[(N[(N[(x * x), $MachinePrecision] * N[(0.125 + N[(x * N[(x * N[(0.0546875 + N[(N[(x * x), $MachinePrecision] * 0.0322265625), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right) + 1\right)
\end{array}
Derivation
  1. Initial program 7.3%

    \[\sqrt{1 + x} - \sqrt{1 - x} \]
  2. Add Preprocessing
  3. Taylor expanded in x around 0

    \[\leadsto \color{blue}{x \cdot \left(1 + {x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)} \]
  4. Step-by-step derivation
    1. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \color{blue}{\left(1 + {x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)}\right) \]
    2. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \color{blue}{\left({x}^{2} \cdot \left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)}\right)\right) \]
    3. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\left(\frac{1}{8} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right) \]
    4. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left(x \cdot x\right), \left(\color{blue}{\frac{1}{8}} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right) \]
    5. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \left(\color{blue}{\frac{1}{8}} + {x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right) \]
    6. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \color{blue}{\left({x}^{2} \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right) \]
    7. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \left(\left(x \cdot x\right) \cdot \left(\color{blue}{\frac{7}{128}} + \frac{33}{1024} \cdot {x}^{2}\right)\right)\right)\right)\right)\right) \]
    8. associate-*l*N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \left(x \cdot \color{blue}{\left(x \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right)\right) \]
    9. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \color{blue}{\left(x \cdot \left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)\right)}\right)\right)\right)\right)\right) \]
    10. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \color{blue}{\left(\frac{7}{128} + \frac{33}{1024} \cdot {x}^{2}\right)}\right)\right)\right)\right)\right)\right) \]
    11. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \color{blue}{\left(\frac{33}{1024} \cdot {x}^{2}\right)}\right)\right)\right)\right)\right)\right)\right) \]
    12. *-commutativeN/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \left({x}^{2} \cdot \color{blue}{\frac{33}{1024}}\right)\right)\right)\right)\right)\right)\right)\right) \]
    13. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\frac{33}{1024}}\right)\right)\right)\right)\right)\right)\right)\right) \]
    14. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\left(x \cdot x\right), \frac{33}{1024}\right)\right)\right)\right)\right)\right)\right)\right) \]
    15. *-lowering-*.f64100.0%

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(\frac{7}{128}, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \frac{33}{1024}\right)\right)\right)\right)\right)\right)\right)\right) \]
  5. Simplified100.0%

    \[\leadsto \color{blue}{x \cdot \left(1 + \left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right)\right)} \]
  6. Final simplification100.0%

    \[\leadsto x \cdot \left(\left(x \cdot x\right) \cdot \left(0.125 + x \cdot \left(x \cdot \left(0.0546875 + \left(x \cdot x\right) \cdot 0.0322265625\right)\right)\right) + 1\right) \]
  7. Add Preprocessing

Alternative 3: 99.7% accurate, 13.8× speedup?

\[\begin{array}{l} \\ x \cdot \left(1 + \left(x \cdot x\right) \cdot \left(0.125 + \left(x \cdot x\right) \cdot 0.0546875\right)\right) \end{array} \]
(FPCore (x)
 :precision binary64
 (* x (+ 1.0 (* (* x x) (+ 0.125 (* (* x x) 0.0546875))))))
double code(double x) {
	return x * (1.0 + ((x * x) * (0.125 + ((x * x) * 0.0546875))));
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = x * (1.0d0 + ((x * x) * (0.125d0 + ((x * x) * 0.0546875d0))))
end function
public static double code(double x) {
	return x * (1.0 + ((x * x) * (0.125 + ((x * x) * 0.0546875))));
}
def code(x):
	return x * (1.0 + ((x * x) * (0.125 + ((x * x) * 0.0546875))))
function code(x)
	return Float64(x * Float64(1.0 + Float64(Float64(x * x) * Float64(0.125 + Float64(Float64(x * x) * 0.0546875)))))
end
function tmp = code(x)
	tmp = x * (1.0 + ((x * x) * (0.125 + ((x * x) * 0.0546875))));
end
code[x_] := N[(x * N[(1.0 + N[(N[(x * x), $MachinePrecision] * N[(0.125 + N[(N[(x * x), $MachinePrecision] * 0.0546875), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
x \cdot \left(1 + \left(x \cdot x\right) \cdot \left(0.125 + \left(x \cdot x\right) \cdot 0.0546875\right)\right)
\end{array}
Derivation
  1. Initial program 7.3%

    \[\sqrt{1 + x} - \sqrt{1 - x} \]
  2. Add Preprocessing
  3. Taylor expanded in x around 0

    \[\leadsto \color{blue}{x \cdot \left(1 + {x}^{2} \cdot \left(\frac{1}{8} + \frac{7}{128} \cdot {x}^{2}\right)\right)} \]
  4. Step-by-step derivation
    1. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \color{blue}{\left(1 + {x}^{2} \cdot \left(\frac{1}{8} + \frac{7}{128} \cdot {x}^{2}\right)\right)}\right) \]
    2. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \color{blue}{\left({x}^{2} \cdot \left(\frac{1}{8} + \frac{7}{128} \cdot {x}^{2}\right)\right)}\right)\right) \]
    3. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\left(\frac{1}{8} + \frac{7}{128} \cdot {x}^{2}\right)}\right)\right)\right) \]
    4. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\left(x \cdot x\right), \left(\color{blue}{\frac{1}{8}} + \frac{7}{128} \cdot {x}^{2}\right)\right)\right)\right) \]
    5. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \left(\color{blue}{\frac{1}{8}} + \frac{7}{128} \cdot {x}^{2}\right)\right)\right)\right) \]
    6. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \color{blue}{\left(\frac{7}{128} \cdot {x}^{2}\right)}\right)\right)\right)\right) \]
    7. *-commutativeN/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \left({x}^{2} \cdot \color{blue}{\frac{7}{128}}\right)\right)\right)\right)\right) \]
    8. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(\left({x}^{2}\right), \color{blue}{\frac{7}{128}}\right)\right)\right)\right)\right) \]
    9. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(\left(x \cdot x\right), \frac{7}{128}\right)\right)\right)\right)\right) \]
    10. *-lowering-*.f6499.9%

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \mathsf{+.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(\mathsf{*.f64}\left(x, x\right), \frac{7}{128}\right)\right)\right)\right)\right) \]
  5. Simplified99.9%

    \[\leadsto \color{blue}{x \cdot \left(1 + \left(x \cdot x\right) \cdot \left(0.125 + \left(x \cdot x\right) \cdot 0.0546875\right)\right)} \]
  6. Add Preprocessing

Alternative 4: 99.5% accurate, 23.0× speedup?

\[\begin{array}{l} \\ x \cdot \left(1 + \left(x \cdot x\right) \cdot 0.125\right) \end{array} \]
(FPCore (x) :precision binary64 (* x (+ 1.0 (* (* x x) 0.125))))
double code(double x) {
	return x * (1.0 + ((x * x) * 0.125));
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = x * (1.0d0 + ((x * x) * 0.125d0))
end function
public static double code(double x) {
	return x * (1.0 + ((x * x) * 0.125));
}
def code(x):
	return x * (1.0 + ((x * x) * 0.125))
function code(x)
	return Float64(x * Float64(1.0 + Float64(Float64(x * x) * 0.125)))
end
function tmp = code(x)
	tmp = x * (1.0 + ((x * x) * 0.125));
end
code[x_] := N[(x * N[(1.0 + N[(N[(x * x), $MachinePrecision] * 0.125), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
x \cdot \left(1 + \left(x \cdot x\right) \cdot 0.125\right)
\end{array}
Derivation
  1. Initial program 7.3%

    \[\sqrt{1 + x} - \sqrt{1 - x} \]
  2. Add Preprocessing
  3. Taylor expanded in x around 0

    \[\leadsto \color{blue}{x \cdot \left(1 + \frac{1}{8} \cdot {x}^{2}\right)} \]
  4. Step-by-step derivation
    1. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \color{blue}{\left(1 + \frac{1}{8} \cdot {x}^{2}\right)}\right) \]
    2. +-lowering-+.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \color{blue}{\left(\frac{1}{8} \cdot {x}^{2}\right)}\right)\right) \]
    3. *-lowering-*.f64N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\frac{1}{8}, \color{blue}{\left({x}^{2}\right)}\right)\right)\right) \]
    4. unpow2N/A

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\frac{1}{8}, \left(x \cdot \color{blue}{x}\right)\right)\right)\right) \]
    5. *-lowering-*.f6499.7%

      \[\leadsto \mathsf{*.f64}\left(x, \mathsf{+.f64}\left(1, \mathsf{*.f64}\left(\frac{1}{8}, \mathsf{*.f64}\left(x, \color{blue}{x}\right)\right)\right)\right) \]
  5. Simplified99.7%

    \[\leadsto \color{blue}{x \cdot \left(1 + 0.125 \cdot \left(x \cdot x\right)\right)} \]
  6. Final simplification99.7%

    \[\leadsto x \cdot \left(1 + \left(x \cdot x\right) \cdot 0.125\right) \]
  7. Add Preprocessing

Alternative 5: 99.0% accurate, 207.0× speedup?

\[\begin{array}{l} \\ x \end{array} \]
(FPCore (x) :precision binary64 x)
double code(double x) {
	return x;
}
real(8) function code(x)
    real(8), intent (in) :: x
    code = x
end function
public static double code(double x) {
	return x;
}
def code(x):
	return x
function code(x)
	return x
end
function tmp = code(x)
	tmp = x;
end
code[x_] := x
\begin{array}{l}

\\
x
\end{array}
Derivation
  1. Initial program 7.3%

    \[\sqrt{1 + x} - \sqrt{1 - x} \]
  2. Add Preprocessing
  3. Taylor expanded in x around 0

    \[\leadsto \color{blue}{x} \]
  4. Step-by-step derivation
    1. Simplified99.4%

      \[\leadsto \color{blue}{x} \]
    2. Add Preprocessing

    Developer Target 1: 100.0% accurate, 1.0× speedup?

    \[\begin{array}{l} \\ \frac{2 \cdot x}{\sqrt{1 + x} + \sqrt{1 - x}} \end{array} \]
    (FPCore (x)
     :precision binary64
     (/ (* 2.0 x) (+ (sqrt (+ 1.0 x)) (sqrt (- 1.0 x)))))
    double code(double x) {
    	return (2.0 * x) / (sqrt((1.0 + x)) + sqrt((1.0 - x)));
    }
    
    real(8) function code(x)
        real(8), intent (in) :: x
        code = (2.0d0 * x) / (sqrt((1.0d0 + x)) + sqrt((1.0d0 - x)))
    end function
    
    public static double code(double x) {
    	return (2.0 * x) / (Math.sqrt((1.0 + x)) + Math.sqrt((1.0 - x)));
    }
    
    def code(x):
    	return (2.0 * x) / (math.sqrt((1.0 + x)) + math.sqrt((1.0 - x)))
    
    function code(x)
    	return Float64(Float64(2.0 * x) / Float64(sqrt(Float64(1.0 + x)) + sqrt(Float64(1.0 - x))))
    end
    
    function tmp = code(x)
    	tmp = (2.0 * x) / (sqrt((1.0 + x)) + sqrt((1.0 - x)));
    end
    
    code[x_] := N[(N[(2.0 * x), $MachinePrecision] / N[(N[Sqrt[N[(1.0 + x), $MachinePrecision]], $MachinePrecision] + N[Sqrt[N[(1.0 - x), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
    
    \begin{array}{l}
    
    \\
    \frac{2 \cdot x}{\sqrt{1 + x} + \sqrt{1 - x}}
    \end{array}
    

    Reproduce

    ?
    herbie shell --seed 2024161 
    (FPCore (x)
      :name "bug333 (missed optimization)"
      :precision binary64
      :pre (and (<= -1.0 x) (<= x 1.0))
    
      :alt
      (! :herbie-platform default (/ (* 2 x) (+ (sqrt (+ 1 x)) (sqrt (- 1 x)))))
    
      (- (sqrt (+ 1.0 x)) (sqrt (- 1.0 x))))