Kahan p9 Example

Percentage Accurate: 68.8% → 92.6%
Time: 8.7s
Alternatives: 5
Speedup: 0.8×

Specification

?
\[\left(0 < x \land x < 1\right) \land y < 1\]
\[\begin{array}{l} \\ \frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \end{array} \]
(FPCore (x y) :precision binary64 (/ (* (- x y) (+ x y)) (+ (* x x) (* y y))))
double code(double x, double y) {
	return ((x - y) * (x + y)) / ((x * x) + (y * y));
}
real(8) function code(x, y)
    real(8), intent (in) :: x
    real(8), intent (in) :: y
    code = ((x - y) * (x + y)) / ((x * x) + (y * y))
end function
public static double code(double x, double y) {
	return ((x - y) * (x + y)) / ((x * x) + (y * y));
}
def code(x, y):
	return ((x - y) * (x + y)) / ((x * x) + (y * y))
function code(x, y)
	return Float64(Float64(Float64(x - y) * Float64(x + y)) / Float64(Float64(x * x) + Float64(y * y)))
end
function tmp = code(x, y)
	tmp = ((x - y) * (x + y)) / ((x * x) + (y * y));
end
code[x_, y_] := N[(N[(N[(x - y), $MachinePrecision] * N[(x + y), $MachinePrecision]), $MachinePrecision] / N[(N[(x * x), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y}
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 5 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 68.8% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \end{array} \]
(FPCore (x y) :precision binary64 (/ (* (- x y) (+ x y)) (+ (* x x) (* y y))))
double code(double x, double y) {
	return ((x - y) * (x + y)) / ((x * x) + (y * y));
}
real(8) function code(x, y)
    real(8), intent (in) :: x
    real(8), intent (in) :: y
    code = ((x - y) * (x + y)) / ((x * x) + (y * y))
end function
public static double code(double x, double y) {
	return ((x - y) * (x + y)) / ((x * x) + (y * y));
}
def code(x, y):
	return ((x - y) * (x + y)) / ((x * x) + (y * y))
function code(x, y)
	return Float64(Float64(Float64(x - y) * Float64(x + y)) / Float64(Float64(x * x) + Float64(y * y)))
end
function tmp = code(x, y)
	tmp = ((x - y) * (x + y)) / ((x * x) + (y * y));
end
code[x_, y_] := N[(N[(N[(x - y), $MachinePrecision] * N[(x + y), $MachinePrecision]), $MachinePrecision] / N[(N[(x * x), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}

\\
\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y}
\end{array}

Alternative 1: 92.6% accurate, 0.7× speedup?

\[\begin{array}{l} y_m = \left|y\right| \\ \begin{array}{l} \mathbf{if}\;y\_m \leq 1.6 \cdot 10^{-162}:\\ \;\;\;\;\mathsf{fma}\left(\frac{y\_m}{x}, \frac{y\_m \cdot -2}{x}, 1\right)\\ \mathbf{elif}\;y\_m \leq 10^{-19}:\\ \;\;\;\;\frac{\left(x - y\_m\right) \cdot \left(y\_m + x\right)}{x \cdot x + y\_m \cdot y\_m}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \end{array} \]
y_m = (fabs.f64 y)
(FPCore (x y_m)
 :precision binary64
 (if (<= y_m 1.6e-162)
   (fma (/ y_m x) (/ (* y_m -2.0) x) 1.0)
   (if (<= y_m 1e-19)
     (/ (* (- x y_m) (+ y_m x)) (+ (* x x) (* y_m y_m)))
     -1.0)))
y_m = fabs(y);
double code(double x, double y_m) {
	double tmp;
	if (y_m <= 1.6e-162) {
		tmp = fma((y_m / x), ((y_m * -2.0) / x), 1.0);
	} else if (y_m <= 1e-19) {
		tmp = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m));
	} else {
		tmp = -1.0;
	}
	return tmp;
}
y_m = abs(y)
function code(x, y_m)
	tmp = 0.0
	if (y_m <= 1.6e-162)
		tmp = fma(Float64(y_m / x), Float64(Float64(y_m * -2.0) / x), 1.0);
	elseif (y_m <= 1e-19)
		tmp = Float64(Float64(Float64(x - y_m) * Float64(y_m + x)) / Float64(Float64(x * x) + Float64(y_m * y_m)));
	else
		tmp = -1.0;
	end
	return tmp
end
y_m = N[Abs[y], $MachinePrecision]
code[x_, y$95$m_] := If[LessEqual[y$95$m, 1.6e-162], N[(N[(y$95$m / x), $MachinePrecision] * N[(N[(y$95$m * -2.0), $MachinePrecision] / x), $MachinePrecision] + 1.0), $MachinePrecision], If[LessEqual[y$95$m, 1e-19], N[(N[(N[(x - y$95$m), $MachinePrecision] * N[(y$95$m + x), $MachinePrecision]), $MachinePrecision] / N[(N[(x * x), $MachinePrecision] + N[(y$95$m * y$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], -1.0]]
\begin{array}{l}
y_m = \left|y\right|

\\
\begin{array}{l}
\mathbf{if}\;y\_m \leq 1.6 \cdot 10^{-162}:\\
\;\;\;\;\mathsf{fma}\left(\frac{y\_m}{x}, \frac{y\_m \cdot -2}{x}, 1\right)\\

\mathbf{elif}\;y\_m \leq 10^{-19}:\\
\;\;\;\;\frac{\left(x - y\_m\right) \cdot \left(y\_m + x\right)}{x \cdot x + y\_m \cdot y\_m}\\

\mathbf{else}:\\
\;\;\;\;-1\\


\end{array}
\end{array}
Derivation
  1. Split input into 3 regimes
  2. if y < 1.59999999999999988e-162

    1. Initial program 59.6%

      \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
    2. Add Preprocessing
    3. Taylor expanded in x around inf

      \[\leadsto \color{blue}{\left(1 + \left(-1 \cdot \frac{y}{x} + \left(-1 \cdot \frac{{y}^{2}}{{x}^{2}} + \frac{y}{x}\right)\right)\right) - \frac{{y}^{2}}{{x}^{2}}} \]
    4. Simplified23.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(y \cdot y, \frac{-2}{x \cdot x}, 1\right)} \]
    5. Step-by-step derivation
      1. associate-*r/N/A

        \[\leadsto \color{blue}{\frac{\left(y \cdot y\right) \cdot -2}{x \cdot x}} + 1 \]
      2. associate-*l*N/A

        \[\leadsto \frac{\color{blue}{y \cdot \left(y \cdot -2\right)}}{x \cdot x} + 1 \]
      3. times-fracN/A

        \[\leadsto \color{blue}{\frac{y}{x} \cdot \frac{y \cdot -2}{x}} + 1 \]
      4. accelerator-lowering-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)} \]
      5. /-lowering-/.f64N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{\frac{y}{x}}, \frac{y \cdot -2}{x}, 1\right) \]
      6. /-lowering-/.f64N/A

        \[\leadsto \mathsf{fma}\left(\frac{y}{x}, \color{blue}{\frac{y \cdot -2}{x}}, 1\right) \]
      7. *-lowering-*.f6437.9

        \[\leadsto \mathsf{fma}\left(\frac{y}{x}, \frac{\color{blue}{y \cdot -2}}{x}, 1\right) \]
    6. Applied egg-rr37.9%

      \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)} \]

    if 1.59999999999999988e-162 < y < 9.9999999999999998e-20

    1. Initial program 99.9%

      \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
    2. Add Preprocessing

    if 9.9999999999999998e-20 < y

    1. Initial program 100.0%

      \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
    2. Add Preprocessing
    3. Taylor expanded in x around 0

      \[\leadsto \color{blue}{-1} \]
    4. Step-by-step derivation
      1. Simplified100.0%

        \[\leadsto \color{blue}{-1} \]
    5. Recombined 3 regimes into one program.
    6. Final simplification48.4%

      \[\leadsto \begin{array}{l} \mathbf{if}\;y \leq 1.6 \cdot 10^{-162}:\\ \;\;\;\;\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)\\ \mathbf{elif}\;y \leq 10^{-19}:\\ \;\;\;\;\frac{\left(x - y\right) \cdot \left(y + x\right)}{x \cdot x + y \cdot y}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \]
    7. Add Preprocessing

    Alternative 2: 92.1% accurate, 0.4× speedup?

    \[\begin{array}{l} y_m = \left|y\right| \\ \begin{array}{l} t_0 := \frac{\left(x - y\_m\right) \cdot \left(y\_m + x\right)}{x \cdot x + y\_m \cdot y\_m}\\ \mathbf{if}\;t\_0 \leq -0.5:\\ \;\;\;\;-1\\ \mathbf{elif}\;t\_0 \leq 2:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \end{array} \]
    y_m = (fabs.f64 y)
    (FPCore (x y_m)
     :precision binary64
     (let* ((t_0 (/ (* (- x y_m) (+ y_m x)) (+ (* x x) (* y_m y_m)))))
       (if (<= t_0 -0.5) -1.0 (if (<= t_0 2.0) 1.0 -1.0))))
    y_m = fabs(y);
    double code(double x, double y_m) {
    	double t_0 = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m));
    	double tmp;
    	if (t_0 <= -0.5) {
    		tmp = -1.0;
    	} else if (t_0 <= 2.0) {
    		tmp = 1.0;
    	} else {
    		tmp = -1.0;
    	}
    	return tmp;
    }
    
    y_m = abs(y)
    real(8) function code(x, y_m)
        real(8), intent (in) :: x
        real(8), intent (in) :: y_m
        real(8) :: t_0
        real(8) :: tmp
        t_0 = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m))
        if (t_0 <= (-0.5d0)) then
            tmp = -1.0d0
        else if (t_0 <= 2.0d0) then
            tmp = 1.0d0
        else
            tmp = -1.0d0
        end if
        code = tmp
    end function
    
    y_m = Math.abs(y);
    public static double code(double x, double y_m) {
    	double t_0 = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m));
    	double tmp;
    	if (t_0 <= -0.5) {
    		tmp = -1.0;
    	} else if (t_0 <= 2.0) {
    		tmp = 1.0;
    	} else {
    		tmp = -1.0;
    	}
    	return tmp;
    }
    
    y_m = math.fabs(y)
    def code(x, y_m):
    	t_0 = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m))
    	tmp = 0
    	if t_0 <= -0.5:
    		tmp = -1.0
    	elif t_0 <= 2.0:
    		tmp = 1.0
    	else:
    		tmp = -1.0
    	return tmp
    
    y_m = abs(y)
    function code(x, y_m)
    	t_0 = Float64(Float64(Float64(x - y_m) * Float64(y_m + x)) / Float64(Float64(x * x) + Float64(y_m * y_m)))
    	tmp = 0.0
    	if (t_0 <= -0.5)
    		tmp = -1.0;
    	elseif (t_0 <= 2.0)
    		tmp = 1.0;
    	else
    		tmp = -1.0;
    	end
    	return tmp
    end
    
    y_m = abs(y);
    function tmp_2 = code(x, y_m)
    	t_0 = ((x - y_m) * (y_m + x)) / ((x * x) + (y_m * y_m));
    	tmp = 0.0;
    	if (t_0 <= -0.5)
    		tmp = -1.0;
    	elseif (t_0 <= 2.0)
    		tmp = 1.0;
    	else
    		tmp = -1.0;
    	end
    	tmp_2 = tmp;
    end
    
    y_m = N[Abs[y], $MachinePrecision]
    code[x_, y$95$m_] := Block[{t$95$0 = N[(N[(N[(x - y$95$m), $MachinePrecision] * N[(y$95$m + x), $MachinePrecision]), $MachinePrecision] / N[(N[(x * x), $MachinePrecision] + N[(y$95$m * y$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]}, If[LessEqual[t$95$0, -0.5], -1.0, If[LessEqual[t$95$0, 2.0], 1.0, -1.0]]]
    
    \begin{array}{l}
    y_m = \left|y\right|
    
    \\
    \begin{array}{l}
    t_0 := \frac{\left(x - y\_m\right) \cdot \left(y\_m + x\right)}{x \cdot x + y\_m \cdot y\_m}\\
    \mathbf{if}\;t\_0 \leq -0.5:\\
    \;\;\;\;-1\\
    
    \mathbf{elif}\;t\_0 \leq 2:\\
    \;\;\;\;1\\
    
    \mathbf{else}:\\
    \;\;\;\;-1\\
    
    
    \end{array}
    \end{array}
    
    Derivation
    1. Split input into 2 regimes
    2. if (/.f64 (*.f64 (-.f64 x y) (+.f64 x y)) (+.f64 (*.f64 x x) (*.f64 y y))) < -0.5 or 2 < (/.f64 (*.f64 (-.f64 x y) (+.f64 x y)) (+.f64 (*.f64 x x) (*.f64 y y)))

      1. Initial program 56.8%

        \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
      2. Add Preprocessing
      3. Taylor expanded in x around 0

        \[\leadsto \color{blue}{-1} \]
      4. Step-by-step derivation
        1. Simplified86.0%

          \[\leadsto \color{blue}{-1} \]

        if -0.5 < (/.f64 (*.f64 (-.f64 x y) (+.f64 x y)) (+.f64 (*.f64 x x) (*.f64 y y))) < 2

        1. Initial program 99.9%

          \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
        2. Add Preprocessing
        3. Taylor expanded in x around inf

          \[\leadsto \color{blue}{1} \]
        4. Step-by-step derivation
          1. Simplified97.2%

            \[\leadsto \color{blue}{1} \]
        5. Recombined 2 regimes into one program.
        6. Final simplification88.5%

          \[\leadsto \begin{array}{l} \mathbf{if}\;\frac{\left(x - y\right) \cdot \left(y + x\right)}{x \cdot x + y \cdot y} \leq -0.5:\\ \;\;\;\;-1\\ \mathbf{elif}\;\frac{\left(x - y\right) \cdot \left(y + x\right)}{x \cdot x + y \cdot y} \leq 2:\\ \;\;\;\;1\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \]
        7. Add Preprocessing

        Alternative 3: 92.2% accurate, 0.8× speedup?

        \[\begin{array}{l} y_m = \left|y\right| \\ \begin{array}{l} \mathbf{if}\;y\_m \leq 1.6 \cdot 10^{-162}:\\ \;\;\;\;\mathsf{fma}\left(\frac{y\_m}{x}, \frac{y\_m \cdot -2}{x}, 1\right)\\ \mathbf{elif}\;y\_m \leq 10^{-19}:\\ \;\;\;\;\left(x - y\_m\right) \cdot \frac{y\_m + x}{\mathsf{fma}\left(x, x, y\_m \cdot y\_m\right)}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \end{array} \]
        y_m = (fabs.f64 y)
        (FPCore (x y_m)
         :precision binary64
         (if (<= y_m 1.6e-162)
           (fma (/ y_m x) (/ (* y_m -2.0) x) 1.0)
           (if (<= y_m 1e-19) (* (- x y_m) (/ (+ y_m x) (fma x x (* y_m y_m)))) -1.0)))
        y_m = fabs(y);
        double code(double x, double y_m) {
        	double tmp;
        	if (y_m <= 1.6e-162) {
        		tmp = fma((y_m / x), ((y_m * -2.0) / x), 1.0);
        	} else if (y_m <= 1e-19) {
        		tmp = (x - y_m) * ((y_m + x) / fma(x, x, (y_m * y_m)));
        	} else {
        		tmp = -1.0;
        	}
        	return tmp;
        }
        
        y_m = abs(y)
        function code(x, y_m)
        	tmp = 0.0
        	if (y_m <= 1.6e-162)
        		tmp = fma(Float64(y_m / x), Float64(Float64(y_m * -2.0) / x), 1.0);
        	elseif (y_m <= 1e-19)
        		tmp = Float64(Float64(x - y_m) * Float64(Float64(y_m + x) / fma(x, x, Float64(y_m * y_m))));
        	else
        		tmp = -1.0;
        	end
        	return tmp
        end
        
        y_m = N[Abs[y], $MachinePrecision]
        code[x_, y$95$m_] := If[LessEqual[y$95$m, 1.6e-162], N[(N[(y$95$m / x), $MachinePrecision] * N[(N[(y$95$m * -2.0), $MachinePrecision] / x), $MachinePrecision] + 1.0), $MachinePrecision], If[LessEqual[y$95$m, 1e-19], N[(N[(x - y$95$m), $MachinePrecision] * N[(N[(y$95$m + x), $MachinePrecision] / N[(x * x + N[(y$95$m * y$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], -1.0]]
        
        \begin{array}{l}
        y_m = \left|y\right|
        
        \\
        \begin{array}{l}
        \mathbf{if}\;y\_m \leq 1.6 \cdot 10^{-162}:\\
        \;\;\;\;\mathsf{fma}\left(\frac{y\_m}{x}, \frac{y\_m \cdot -2}{x}, 1\right)\\
        
        \mathbf{elif}\;y\_m \leq 10^{-19}:\\
        \;\;\;\;\left(x - y\_m\right) \cdot \frac{y\_m + x}{\mathsf{fma}\left(x, x, y\_m \cdot y\_m\right)}\\
        
        \mathbf{else}:\\
        \;\;\;\;-1\\
        
        
        \end{array}
        \end{array}
        
        Derivation
        1. Split input into 3 regimes
        2. if y < 1.59999999999999988e-162

          1. Initial program 59.6%

            \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
          2. Add Preprocessing
          3. Taylor expanded in x around inf

            \[\leadsto \color{blue}{\left(1 + \left(-1 \cdot \frac{y}{x} + \left(-1 \cdot \frac{{y}^{2}}{{x}^{2}} + \frac{y}{x}\right)\right)\right) - \frac{{y}^{2}}{{x}^{2}}} \]
          4. Simplified23.9%

            \[\leadsto \color{blue}{\mathsf{fma}\left(y \cdot y, \frac{-2}{x \cdot x}, 1\right)} \]
          5. Step-by-step derivation
            1. associate-*r/N/A

              \[\leadsto \color{blue}{\frac{\left(y \cdot y\right) \cdot -2}{x \cdot x}} + 1 \]
            2. associate-*l*N/A

              \[\leadsto \frac{\color{blue}{y \cdot \left(y \cdot -2\right)}}{x \cdot x} + 1 \]
            3. times-fracN/A

              \[\leadsto \color{blue}{\frac{y}{x} \cdot \frac{y \cdot -2}{x}} + 1 \]
            4. accelerator-lowering-fma.f64N/A

              \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)} \]
            5. /-lowering-/.f64N/A

              \[\leadsto \mathsf{fma}\left(\color{blue}{\frac{y}{x}}, \frac{y \cdot -2}{x}, 1\right) \]
            6. /-lowering-/.f64N/A

              \[\leadsto \mathsf{fma}\left(\frac{y}{x}, \color{blue}{\frac{y \cdot -2}{x}}, 1\right) \]
            7. *-lowering-*.f6437.9

              \[\leadsto \mathsf{fma}\left(\frac{y}{x}, \frac{\color{blue}{y \cdot -2}}{x}, 1\right) \]
          6. Applied egg-rr37.9%

            \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)} \]

          if 1.59999999999999988e-162 < y < 9.9999999999999998e-20

          1. Initial program 99.9%

            \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
          2. Add Preprocessing
          3. Step-by-step derivation
            1. associate-*r/N/A

              \[\leadsto \color{blue}{\left(x - y\right) \cdot \frac{x + y}{x \cdot x + y \cdot y}} \]
            2. *-commutativeN/A

              \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y} \cdot \left(x - y\right)} \]
            3. *-lowering-*.f64N/A

              \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y} \cdot \left(x - y\right)} \]
            4. /-lowering-/.f64N/A

              \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y}} \cdot \left(x - y\right) \]
            5. +-lowering-+.f64N/A

              \[\leadsto \frac{\color{blue}{x + y}}{x \cdot x + y \cdot y} \cdot \left(x - y\right) \]
            6. accelerator-lowering-fma.f64N/A

              \[\leadsto \frac{x + y}{\color{blue}{\mathsf{fma}\left(x, x, y \cdot y\right)}} \cdot \left(x - y\right) \]
            7. *-lowering-*.f64N/A

              \[\leadsto \frac{x + y}{\mathsf{fma}\left(x, x, \color{blue}{y \cdot y}\right)} \cdot \left(x - y\right) \]
            8. --lowering--.f6499.7

              \[\leadsto \frac{x + y}{\mathsf{fma}\left(x, x, y \cdot y\right)} \cdot \color{blue}{\left(x - y\right)} \]
          4. Applied egg-rr99.7%

            \[\leadsto \color{blue}{\frac{x + y}{\mathsf{fma}\left(x, x, y \cdot y\right)} \cdot \left(x - y\right)} \]

          if 9.9999999999999998e-20 < y

          1. Initial program 100.0%

            \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
          2. Add Preprocessing
          3. Taylor expanded in x around 0

            \[\leadsto \color{blue}{-1} \]
          4. Step-by-step derivation
            1. Simplified100.0%

              \[\leadsto \color{blue}{-1} \]
          5. Recombined 3 regimes into one program.
          6. Final simplification48.3%

            \[\leadsto \begin{array}{l} \mathbf{if}\;y \leq 1.6 \cdot 10^{-162}:\\ \;\;\;\;\mathsf{fma}\left(\frac{y}{x}, \frac{y \cdot -2}{x}, 1\right)\\ \mathbf{elif}\;y \leq 10^{-19}:\\ \;\;\;\;\left(x - y\right) \cdot \frac{y + x}{\mathsf{fma}\left(x, x, y \cdot y\right)}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \]
          7. Add Preprocessing

          Alternative 4: 91.6% accurate, 0.8× speedup?

          \[\begin{array}{l} y_m = \left|y\right| \\ \begin{array}{l} \mathbf{if}\;y\_m \leq 6.2 \cdot 10^{-178}:\\ \;\;\;\;1\\ \mathbf{elif}\;y\_m \leq 10^{-16}:\\ \;\;\;\;\left(x - y\_m\right) \cdot \frac{y\_m + x}{\mathsf{fma}\left(x, x, y\_m \cdot y\_m\right)}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \end{array} \]
          y_m = (fabs.f64 y)
          (FPCore (x y_m)
           :precision binary64
           (if (<= y_m 6.2e-178)
             1.0
             (if (<= y_m 1e-16) (* (- x y_m) (/ (+ y_m x) (fma x x (* y_m y_m)))) -1.0)))
          y_m = fabs(y);
          double code(double x, double y_m) {
          	double tmp;
          	if (y_m <= 6.2e-178) {
          		tmp = 1.0;
          	} else if (y_m <= 1e-16) {
          		tmp = (x - y_m) * ((y_m + x) / fma(x, x, (y_m * y_m)));
          	} else {
          		tmp = -1.0;
          	}
          	return tmp;
          }
          
          y_m = abs(y)
          function code(x, y_m)
          	tmp = 0.0
          	if (y_m <= 6.2e-178)
          		tmp = 1.0;
          	elseif (y_m <= 1e-16)
          		tmp = Float64(Float64(x - y_m) * Float64(Float64(y_m + x) / fma(x, x, Float64(y_m * y_m))));
          	else
          		tmp = -1.0;
          	end
          	return tmp
          end
          
          y_m = N[Abs[y], $MachinePrecision]
          code[x_, y$95$m_] := If[LessEqual[y$95$m, 6.2e-178], 1.0, If[LessEqual[y$95$m, 1e-16], N[(N[(x - y$95$m), $MachinePrecision] * N[(N[(y$95$m + x), $MachinePrecision] / N[(x * x + N[(y$95$m * y$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], -1.0]]
          
          \begin{array}{l}
          y_m = \left|y\right|
          
          \\
          \begin{array}{l}
          \mathbf{if}\;y\_m \leq 6.2 \cdot 10^{-178}:\\
          \;\;\;\;1\\
          
          \mathbf{elif}\;y\_m \leq 10^{-16}:\\
          \;\;\;\;\left(x - y\_m\right) \cdot \frac{y\_m + x}{\mathsf{fma}\left(x, x, y\_m \cdot y\_m\right)}\\
          
          \mathbf{else}:\\
          \;\;\;\;-1\\
          
          
          \end{array}
          \end{array}
          
          Derivation
          1. Split input into 3 regimes
          2. if y < 6.1999999999999999e-178

            1. Initial program 60.0%

              \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
            2. Add Preprocessing
            3. Taylor expanded in x around inf

              \[\leadsto \color{blue}{1} \]
            4. Step-by-step derivation
              1. Simplified35.1%

                \[\leadsto \color{blue}{1} \]

              if 6.1999999999999999e-178 < y < 9.9999999999999998e-17

              1. Initial program 91.4%

                \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
              2. Add Preprocessing
              3. Step-by-step derivation
                1. associate-*r/N/A

                  \[\leadsto \color{blue}{\left(x - y\right) \cdot \frac{x + y}{x \cdot x + y \cdot y}} \]
                2. *-commutativeN/A

                  \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y} \cdot \left(x - y\right)} \]
                3. *-lowering-*.f64N/A

                  \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y} \cdot \left(x - y\right)} \]
                4. /-lowering-/.f64N/A

                  \[\leadsto \color{blue}{\frac{x + y}{x \cdot x + y \cdot y}} \cdot \left(x - y\right) \]
                5. +-lowering-+.f64N/A

                  \[\leadsto \frac{\color{blue}{x + y}}{x \cdot x + y \cdot y} \cdot \left(x - y\right) \]
                6. accelerator-lowering-fma.f64N/A

                  \[\leadsto \frac{x + y}{\color{blue}{\mathsf{fma}\left(x, x, y \cdot y\right)}} \cdot \left(x - y\right) \]
                7. *-lowering-*.f64N/A

                  \[\leadsto \frac{x + y}{\mathsf{fma}\left(x, x, \color{blue}{y \cdot y}\right)} \cdot \left(x - y\right) \]
                8. --lowering--.f6491.5

                  \[\leadsto \frac{x + y}{\mathsf{fma}\left(x, x, y \cdot y\right)} \cdot \color{blue}{\left(x - y\right)} \]
              4. Applied egg-rr91.5%

                \[\leadsto \color{blue}{\frac{x + y}{\mathsf{fma}\left(x, x, y \cdot y\right)} \cdot \left(x - y\right)} \]

              if 9.9999999999999998e-17 < y

              1. Initial program 100.0%

                \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
              2. Add Preprocessing
              3. Taylor expanded in x around 0

                \[\leadsto \color{blue}{-1} \]
              4. Step-by-step derivation
                1. Simplified100.0%

                  \[\leadsto \color{blue}{-1} \]
              5. Recombined 3 regimes into one program.
              6. Final simplification46.5%

                \[\leadsto \begin{array}{l} \mathbf{if}\;y \leq 6.2 \cdot 10^{-178}:\\ \;\;\;\;1\\ \mathbf{elif}\;y \leq 10^{-16}:\\ \;\;\;\;\left(x - y\right) \cdot \frac{y + x}{\mathsf{fma}\left(x, x, y \cdot y\right)}\\ \mathbf{else}:\\ \;\;\;\;-1\\ \end{array} \]
              7. Add Preprocessing

              Alternative 5: 66.9% accurate, 36.0× speedup?

              \[\begin{array}{l} y_m = \left|y\right| \\ -1 \end{array} \]
              y_m = (fabs.f64 y)
              (FPCore (x y_m) :precision binary64 -1.0)
              y_m = fabs(y);
              double code(double x, double y_m) {
              	return -1.0;
              }
              
              y_m = abs(y)
              real(8) function code(x, y_m)
                  real(8), intent (in) :: x
                  real(8), intent (in) :: y_m
                  code = -1.0d0
              end function
              
              y_m = Math.abs(y);
              public static double code(double x, double y_m) {
              	return -1.0;
              }
              
              y_m = math.fabs(y)
              def code(x, y_m):
              	return -1.0
              
              y_m = abs(y)
              function code(x, y_m)
              	return -1.0
              end
              
              y_m = abs(y);
              function tmp = code(x, y_m)
              	tmp = -1.0;
              end
              
              y_m = N[Abs[y], $MachinePrecision]
              code[x_, y$95$m_] := -1.0
              
              \begin{array}{l}
              y_m = \left|y\right|
              
              \\
              -1
              \end{array}
              
              Derivation
              1. Initial program 66.4%

                \[\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y} \]
              2. Add Preprocessing
              3. Taylor expanded in x around 0

                \[\leadsto \color{blue}{-1} \]
              4. Step-by-step derivation
                1. Simplified67.2%

                  \[\leadsto \color{blue}{-1} \]
                2. Add Preprocessing

                Developer Target 1: 99.9% accurate, 0.4× speedup?

                \[\begin{array}{l} \\ \begin{array}{l} t_0 := \left|\frac{x}{y}\right|\\ \mathbf{if}\;0.5 < t\_0 \land t\_0 < 2:\\ \;\;\;\;\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y}\\ \mathbf{else}:\\ \;\;\;\;1 - \frac{2}{1 + \frac{x}{y} \cdot \frac{x}{y}}\\ \end{array} \end{array} \]
                (FPCore (x y)
                 :precision binary64
                 (let* ((t_0 (fabs (/ x y))))
                   (if (and (< 0.5 t_0) (< t_0 2.0))
                     (/ (* (- x y) (+ x y)) (+ (* x x) (* y y)))
                     (- 1.0 (/ 2.0 (+ 1.0 (* (/ x y) (/ x y))))))))
                double code(double x, double y) {
                	double t_0 = fabs((x / y));
                	double tmp;
                	if ((0.5 < t_0) && (t_0 < 2.0)) {
                		tmp = ((x - y) * (x + y)) / ((x * x) + (y * y));
                	} else {
                		tmp = 1.0 - (2.0 / (1.0 + ((x / y) * (x / y))));
                	}
                	return tmp;
                }
                
                real(8) function code(x, y)
                    real(8), intent (in) :: x
                    real(8), intent (in) :: y
                    real(8) :: t_0
                    real(8) :: tmp
                    t_0 = abs((x / y))
                    if ((0.5d0 < t_0) .and. (t_0 < 2.0d0)) then
                        tmp = ((x - y) * (x + y)) / ((x * x) + (y * y))
                    else
                        tmp = 1.0d0 - (2.0d0 / (1.0d0 + ((x / y) * (x / y))))
                    end if
                    code = tmp
                end function
                
                public static double code(double x, double y) {
                	double t_0 = Math.abs((x / y));
                	double tmp;
                	if ((0.5 < t_0) && (t_0 < 2.0)) {
                		tmp = ((x - y) * (x + y)) / ((x * x) + (y * y));
                	} else {
                		tmp = 1.0 - (2.0 / (1.0 + ((x / y) * (x / y))));
                	}
                	return tmp;
                }
                
                def code(x, y):
                	t_0 = math.fabs((x / y))
                	tmp = 0
                	if (0.5 < t_0) and (t_0 < 2.0):
                		tmp = ((x - y) * (x + y)) / ((x * x) + (y * y))
                	else:
                		tmp = 1.0 - (2.0 / (1.0 + ((x / y) * (x / y))))
                	return tmp
                
                function code(x, y)
                	t_0 = abs(Float64(x / y))
                	tmp = 0.0
                	if ((0.5 < t_0) && (t_0 < 2.0))
                		tmp = Float64(Float64(Float64(x - y) * Float64(x + y)) / Float64(Float64(x * x) + Float64(y * y)));
                	else
                		tmp = Float64(1.0 - Float64(2.0 / Float64(1.0 + Float64(Float64(x / y) * Float64(x / y)))));
                	end
                	return tmp
                end
                
                function tmp_2 = code(x, y)
                	t_0 = abs((x / y));
                	tmp = 0.0;
                	if ((0.5 < t_0) && (t_0 < 2.0))
                		tmp = ((x - y) * (x + y)) / ((x * x) + (y * y));
                	else
                		tmp = 1.0 - (2.0 / (1.0 + ((x / y) * (x / y))));
                	end
                	tmp_2 = tmp;
                end
                
                code[x_, y_] := Block[{t$95$0 = N[Abs[N[(x / y), $MachinePrecision]], $MachinePrecision]}, If[And[Less[0.5, t$95$0], Less[t$95$0, 2.0]], N[(N[(N[(x - y), $MachinePrecision] * N[(x + y), $MachinePrecision]), $MachinePrecision] / N[(N[(x * x), $MachinePrecision] + N[(y * y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(1.0 - N[(2.0 / N[(1.0 + N[(N[(x / y), $MachinePrecision] * N[(x / y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]]]
                
                \begin{array}{l}
                
                \\
                \begin{array}{l}
                t_0 := \left|\frac{x}{y}\right|\\
                \mathbf{if}\;0.5 < t\_0 \land t\_0 < 2:\\
                \;\;\;\;\frac{\left(x - y\right) \cdot \left(x + y\right)}{x \cdot x + y \cdot y}\\
                
                \mathbf{else}:\\
                \;\;\;\;1 - \frac{2}{1 + \frac{x}{y} \cdot \frac{x}{y}}\\
                
                
                \end{array}
                \end{array}
                

                Reproduce

                ?
                herbie shell --seed 2024198 
                (FPCore (x y)
                  :name "Kahan p9 Example"
                  :precision binary64
                  :pre (and (and (< 0.0 x) (< x 1.0)) (< y 1.0))
                
                  :alt
                  (! :herbie-platform default (if (< 1/2 (fabs (/ x y)) 2) (/ (* (- x y) (+ x y)) (+ (* x x) (* y y))) (- 1 (/ 2 (+ 1 (* (/ x y) (/ x y)))))))
                
                  (/ (* (- x y) (+ x y)) (+ (* x x) (* y y))))