Given's Rotation SVD example

Percentage Accurate: 79.2% → 99.7%
Time: 9.9s
Alternatives: 6
Speedup: 0.6×

Specification

?
\[10^{-150} < \left|x\right| \land \left|x\right| < 10^{+150}\]
\[\begin{array}{l} \\ \sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \end{array} \]
(FPCore (p x)
 :precision binary64
 (sqrt (* 0.5 (+ 1.0 (/ x (sqrt (+ (* (* 4.0 p) p) (* x x))))))))
double code(double p, double x) {
	return sqrt((0.5 * (1.0 + (x / sqrt((((4.0 * p) * p) + (x * x)))))));
}
real(8) function code(p, x)
    real(8), intent (in) :: p
    real(8), intent (in) :: x
    code = sqrt((0.5d0 * (1.0d0 + (x / sqrt((((4.0d0 * p) * p) + (x * x)))))))
end function
public static double code(double p, double x) {
	return Math.sqrt((0.5 * (1.0 + (x / Math.sqrt((((4.0 * p) * p) + (x * x)))))));
}
def code(p, x):
	return math.sqrt((0.5 * (1.0 + (x / math.sqrt((((4.0 * p) * p) + (x * x)))))))
function code(p, x)
	return sqrt(Float64(0.5 * Float64(1.0 + Float64(x / sqrt(Float64(Float64(Float64(4.0 * p) * p) + Float64(x * x)))))))
end
function tmp = code(p, x)
	tmp = sqrt((0.5 * (1.0 + (x / sqrt((((4.0 * p) * p) + (x * x)))))));
end
code[p_, x_] := N[Sqrt[N[(0.5 * N[(1.0 + N[(x / N[Sqrt[N[(N[(N[(4.0 * p), $MachinePrecision] * p), $MachinePrecision] + N[(x * x), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}

\\
\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}
\end{array}

Sampling outcomes in binary64 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 6 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 79.2% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \end{array} \]
(FPCore (p x)
 :precision binary64
 (sqrt (* 0.5 (+ 1.0 (/ x (sqrt (+ (* (* 4.0 p) p) (* x x))))))))
double code(double p, double x) {
	return sqrt((0.5 * (1.0 + (x / sqrt((((4.0 * p) * p) + (x * x)))))));
}
real(8) function code(p, x)
    real(8), intent (in) :: p
    real(8), intent (in) :: x
    code = sqrt((0.5d0 * (1.0d0 + (x / sqrt((((4.0d0 * p) * p) + (x * x)))))))
end function
public static double code(double p, double x) {
	return Math.sqrt((0.5 * (1.0 + (x / Math.sqrt((((4.0 * p) * p) + (x * x)))))));
}
def code(p, x):
	return math.sqrt((0.5 * (1.0 + (x / math.sqrt((((4.0 * p) * p) + (x * x)))))))
function code(p, x)
	return sqrt(Float64(0.5 * Float64(1.0 + Float64(x / sqrt(Float64(Float64(Float64(4.0 * p) * p) + Float64(x * x)))))))
end
function tmp = code(p, x)
	tmp = sqrt((0.5 * (1.0 + (x / sqrt((((4.0 * p) * p) + (x * x)))))));
end
code[p_, x_] := N[Sqrt[N[(0.5 * N[(1.0 + N[(x / N[Sqrt[N[(N[(N[(4.0 * p), $MachinePrecision] * p), $MachinePrecision] + N[(x * x), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}

\\
\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}
\end{array}

Alternative 1: 99.7% accurate, 0.6× speedup?

\[\begin{array}{l} p_m = \left|p\right| \\ \begin{array}{l} t_0 := p\_m \cdot \left(4 \cdot p\_m\right)\\ \mathbf{if}\;\frac{x}{\sqrt{t\_0 + x \cdot x}} \leq -0.5:\\ \;\;\;\;\frac{p\_m}{-x}\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, t\_0\right)}}, 0.5, 0.5\right)}\\ \end{array} \end{array} \]
p_m = (fabs.f64 p)
(FPCore (p_m x)
 :precision binary64
 (let* ((t_0 (* p_m (* 4.0 p_m))))
   (if (<= (/ x (sqrt (+ t_0 (* x x)))) -0.5)
     (/ p_m (- x))
     (sqrt (fma (/ x (sqrt (fma x x t_0))) 0.5 0.5)))))
p_m = fabs(p);
double code(double p_m, double x) {
	double t_0 = p_m * (4.0 * p_m);
	double tmp;
	if ((x / sqrt((t_0 + (x * x)))) <= -0.5) {
		tmp = p_m / -x;
	} else {
		tmp = sqrt(fma((x / sqrt(fma(x, x, t_0))), 0.5, 0.5));
	}
	return tmp;
}
p_m = abs(p)
function code(p_m, x)
	t_0 = Float64(p_m * Float64(4.0 * p_m))
	tmp = 0.0
	if (Float64(x / sqrt(Float64(t_0 + Float64(x * x)))) <= -0.5)
		tmp = Float64(p_m / Float64(-x));
	else
		tmp = sqrt(fma(Float64(x / sqrt(fma(x, x, t_0))), 0.5, 0.5));
	end
	return tmp
end
p_m = N[Abs[p], $MachinePrecision]
code[p$95$m_, x_] := Block[{t$95$0 = N[(p$95$m * N[(4.0 * p$95$m), $MachinePrecision]), $MachinePrecision]}, If[LessEqual[N[(x / N[Sqrt[N[(t$95$0 + N[(x * x), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision], -0.5], N[(p$95$m / (-x)), $MachinePrecision], N[Sqrt[N[(N[(x / N[Sqrt[N[(x * x + t$95$0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] * 0.5 + 0.5), $MachinePrecision]], $MachinePrecision]]]
\begin{array}{l}
p_m = \left|p\right|

\\
\begin{array}{l}
t_0 := p\_m \cdot \left(4 \cdot p\_m\right)\\
\mathbf{if}\;\frac{x}{\sqrt{t\_0 + x \cdot x}} \leq -0.5:\\
\;\;\;\;\frac{p\_m}{-x}\\

\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, t\_0\right)}}, 0.5, 0.5\right)}\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (/.f64 x (sqrt.f64 (+.f64 (*.f64 (*.f64 #s(literal 4 binary64) p) p) (*.f64 x x)))) < -0.5

    1. Initial program 23.6%

      \[\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. lift-*.f64N/A

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      2. lift-+.f64N/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      3. +-commutativeN/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} + 1\right)}} \]
      4. distribute-rgt-inN/A

        \[\leadsto \sqrt{\color{blue}{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + 1 \cdot \frac{1}{2}}} \]
      5. metadata-evalN/A

        \[\leadsto \sqrt{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + \color{blue}{\frac{1}{2}}} \]
      6. lower-fma.f6423.6

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}, 0.5, 0.5\right)}} \]
      7. lift-+.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\left(4 \cdot p\right) \cdot p + x \cdot x}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      8. +-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x + \left(4 \cdot p\right) \cdot p}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      9. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x} + \left(4 \cdot p\right) \cdot p}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      10. lower-fma.f6423.6

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\mathsf{fma}\left(x, x, \left(4 \cdot p\right) \cdot p\right)}}}, 0.5, 0.5\right)} \]
      11. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{\left(4 \cdot p\right) \cdot p}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      12. *-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      13. lower-*.f6423.6

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, 0.5, 0.5\right)} \]
    4. Applied rewrites23.6%

      \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, p \cdot \left(4 \cdot p\right)\right)}}, 0.5, 0.5\right)}} \]
    5. Taylor expanded in x around -inf

      \[\leadsto \color{blue}{-1 \cdot \frac{p}{x}} \]
    6. Step-by-step derivation
      1. mul-1-negN/A

        \[\leadsto \color{blue}{\mathsf{neg}\left(\frac{p}{x}\right)} \]
      2. distribute-neg-frac2N/A

        \[\leadsto \color{blue}{\frac{p}{\mathsf{neg}\left(x\right)}} \]
      3. mul-1-negN/A

        \[\leadsto \frac{p}{\color{blue}{-1 \cdot x}} \]
      4. lower-/.f64N/A

        \[\leadsto \color{blue}{\frac{p}{-1 \cdot x}} \]
      5. mul-1-negN/A

        \[\leadsto \frac{p}{\color{blue}{\mathsf{neg}\left(x\right)}} \]
      6. lower-neg.f6499.8

        \[\leadsto \frac{p}{\color{blue}{-x}} \]
    7. Applied rewrites99.8%

      \[\leadsto \color{blue}{\frac{p}{-x}} \]

    if -0.5 < (/.f64 x (sqrt.f64 (+.f64 (*.f64 (*.f64 #s(literal 4 binary64) p) p) (*.f64 x x))))

    1. Initial program 100.0%

      \[\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. lift-*.f64N/A

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      2. lift-+.f64N/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      3. +-commutativeN/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} + 1\right)}} \]
      4. distribute-rgt-inN/A

        \[\leadsto \sqrt{\color{blue}{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + 1 \cdot \frac{1}{2}}} \]
      5. metadata-evalN/A

        \[\leadsto \sqrt{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + \color{blue}{\frac{1}{2}}} \]
      6. lower-fma.f64100.0

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}, 0.5, 0.5\right)}} \]
      7. lift-+.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\left(4 \cdot p\right) \cdot p + x \cdot x}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      8. +-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x + \left(4 \cdot p\right) \cdot p}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      9. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x} + \left(4 \cdot p\right) \cdot p}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      10. lower-fma.f64100.0

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\mathsf{fma}\left(x, x, \left(4 \cdot p\right) \cdot p\right)}}}, 0.5, 0.5\right)} \]
      11. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{\left(4 \cdot p\right) \cdot p}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      12. *-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      13. lower-*.f64100.0

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, 0.5, 0.5\right)} \]
    4. Applied rewrites100.0%

      \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, p \cdot \left(4 \cdot p\right)\right)}}, 0.5, 0.5\right)}} \]
  3. Recombined 2 regimes into one program.
  4. Final simplification99.9%

    \[\leadsto \begin{array}{l} \mathbf{if}\;\frac{x}{\sqrt{p \cdot \left(4 \cdot p\right) + x \cdot x}} \leq -0.5:\\ \;\;\;\;\frac{p}{-x}\\ \mathbf{else}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, p \cdot \left(4 \cdot p\right)\right)}}, 0.5, 0.5\right)}\\ \end{array} \]
  5. Add Preprocessing

Alternative 2: 99.2% accurate, 0.5× speedup?

\[\begin{array}{l} p_m = \left|p\right| \\ \begin{array}{l} t_0 := \frac{x}{\sqrt{p\_m \cdot \left(4 \cdot p\_m\right) + x \cdot x}}\\ \mathbf{if}\;t\_0 \leq -0.5:\\ \;\;\;\;\frac{p\_m}{-x}\\ \mathbf{elif}\;t\_0 \leq 2 \cdot 10^{-5}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{x}{p\_m}, 0.5\right)}\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(-0.5, \frac{p\_m \cdot p\_m}{x \cdot x}, 1\right)\\ \end{array} \end{array} \]
p_m = (fabs.f64 p)
(FPCore (p_m x)
 :precision binary64
 (let* ((t_0 (/ x (sqrt (+ (* p_m (* 4.0 p_m)) (* x x))))))
   (if (<= t_0 -0.5)
     (/ p_m (- x))
     (if (<= t_0 2e-5)
       (sqrt (fma 0.25 (/ x p_m) 0.5))
       (fma -0.5 (/ (* p_m p_m) (* x x)) 1.0)))))
p_m = fabs(p);
double code(double p_m, double x) {
	double t_0 = x / sqrt(((p_m * (4.0 * p_m)) + (x * x)));
	double tmp;
	if (t_0 <= -0.5) {
		tmp = p_m / -x;
	} else if (t_0 <= 2e-5) {
		tmp = sqrt(fma(0.25, (x / p_m), 0.5));
	} else {
		tmp = fma(-0.5, ((p_m * p_m) / (x * x)), 1.0);
	}
	return tmp;
}
p_m = abs(p)
function code(p_m, x)
	t_0 = Float64(x / sqrt(Float64(Float64(p_m * Float64(4.0 * p_m)) + Float64(x * x))))
	tmp = 0.0
	if (t_0 <= -0.5)
		tmp = Float64(p_m / Float64(-x));
	elseif (t_0 <= 2e-5)
		tmp = sqrt(fma(0.25, Float64(x / p_m), 0.5));
	else
		tmp = fma(-0.5, Float64(Float64(p_m * p_m) / Float64(x * x)), 1.0);
	end
	return tmp
end
p_m = N[Abs[p], $MachinePrecision]
code[p$95$m_, x_] := Block[{t$95$0 = N[(x / N[Sqrt[N[(N[(p$95$m * N[(4.0 * p$95$m), $MachinePrecision]), $MachinePrecision] + N[(x * x), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[t$95$0, -0.5], N[(p$95$m / (-x)), $MachinePrecision], If[LessEqual[t$95$0, 2e-5], N[Sqrt[N[(0.25 * N[(x / p$95$m), $MachinePrecision] + 0.5), $MachinePrecision]], $MachinePrecision], N[(-0.5 * N[(N[(p$95$m * p$95$m), $MachinePrecision] / N[(x * x), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]]]]
\begin{array}{l}
p_m = \left|p\right|

\\
\begin{array}{l}
t_0 := \frac{x}{\sqrt{p\_m \cdot \left(4 \cdot p\_m\right) + x \cdot x}}\\
\mathbf{if}\;t\_0 \leq -0.5:\\
\;\;\;\;\frac{p\_m}{-x}\\

\mathbf{elif}\;t\_0 \leq 2 \cdot 10^{-5}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{x}{p\_m}, 0.5\right)}\\

\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(-0.5, \frac{p\_m \cdot p\_m}{x \cdot x}, 1\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 3 regimes
  2. if (/.f64 x (sqrt.f64 (+.f64 (*.f64 (*.f64 #s(literal 4 binary64) p) p) (*.f64 x x)))) < -0.5

    1. Initial program 16.5%

      \[\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. lift-*.f64N/A

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      2. lift-+.f64N/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      3. +-commutativeN/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} + 1\right)}} \]
      4. distribute-rgt-inN/A

        \[\leadsto \sqrt{\color{blue}{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + 1 \cdot \frac{1}{2}}} \]
      5. metadata-evalN/A

        \[\leadsto \sqrt{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + \color{blue}{\frac{1}{2}}} \]
      6. lower-fma.f6416.5

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}, 0.5, 0.5\right)}} \]
      7. lift-+.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\left(4 \cdot p\right) \cdot p + x \cdot x}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      8. +-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x + \left(4 \cdot p\right) \cdot p}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      9. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x} + \left(4 \cdot p\right) \cdot p}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      10. lower-fma.f6416.5

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\mathsf{fma}\left(x, x, \left(4 \cdot p\right) \cdot p\right)}}}, 0.5, 0.5\right)} \]
      11. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{\left(4 \cdot p\right) \cdot p}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      12. *-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      13. lower-*.f6416.5

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, 0.5, 0.5\right)} \]
    4. Applied rewrites16.5%

      \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, p \cdot \left(4 \cdot p\right)\right)}}, 0.5, 0.5\right)}} \]
    5. Taylor expanded in x around -inf

      \[\leadsto \color{blue}{-1 \cdot \frac{p}{x}} \]
    6. Step-by-step derivation
      1. mul-1-negN/A

        \[\leadsto \color{blue}{\mathsf{neg}\left(\frac{p}{x}\right)} \]
      2. distribute-neg-frac2N/A

        \[\leadsto \color{blue}{\frac{p}{\mathsf{neg}\left(x\right)}} \]
      3. mul-1-negN/A

        \[\leadsto \frac{p}{\color{blue}{-1 \cdot x}} \]
      4. lower-/.f64N/A

        \[\leadsto \color{blue}{\frac{p}{-1 \cdot x}} \]
      5. mul-1-negN/A

        \[\leadsto \frac{p}{\color{blue}{\mathsf{neg}\left(x\right)}} \]
      6. lower-neg.f6499.0

        \[\leadsto \frac{p}{\color{blue}{-x}} \]
    7. Applied rewrites99.0%

      \[\leadsto \color{blue}{\frac{p}{-x}} \]

    if -0.5 < (/.f64 x (sqrt.f64 (+.f64 (*.f64 (*.f64 #s(literal 4 binary64) p) p) (*.f64 x x)))) < 2.00000000000000016e-5

    1. Initial program 100.0%

      \[\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \]
    2. Add Preprocessing
    3. Taylor expanded in x around 0

      \[\leadsto \sqrt{\color{blue}{\frac{1}{2} + \frac{1}{4} \cdot \frac{x}{p}}} \]
    4. Step-by-step derivation
      1. +-commutativeN/A

        \[\leadsto \sqrt{\color{blue}{\frac{1}{4} \cdot \frac{x}{p} + \frac{1}{2}}} \]
      2. lower-fma.f64N/A

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{1}{4}, \frac{x}{p}, \frac{1}{2}\right)}} \]
      3. lower-/.f6499.7

        \[\leadsto \sqrt{\mathsf{fma}\left(0.25, \color{blue}{\frac{x}{p}}, 0.5\right)} \]
    5. Applied rewrites99.7%

      \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(0.25, \frac{x}{p}, 0.5\right)}} \]

    if 2.00000000000000016e-5 < (/.f64 x (sqrt.f64 (+.f64 (*.f64 (*.f64 #s(literal 4 binary64) p) p) (*.f64 x x))))

    1. Initial program 100.0%

      \[\sqrt{0.5 \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)} \]
    2. Add Preprocessing
    3. Step-by-step derivation
      1. lift-*.f64N/A

        \[\leadsto \sqrt{\color{blue}{\frac{1}{2} \cdot \left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      2. lift-+.f64N/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(1 + \frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}\right)}} \]
      3. +-commutativeN/A

        \[\leadsto \sqrt{\frac{1}{2} \cdot \color{blue}{\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} + 1\right)}} \]
      4. distribute-rgt-inN/A

        \[\leadsto \sqrt{\color{blue}{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + 1 \cdot \frac{1}{2}}} \]
      5. metadata-evalN/A

        \[\leadsto \sqrt{\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}} \cdot \frac{1}{2} + \color{blue}{\frac{1}{2}}} \]
      6. lower-fma.f64100.0

        \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\left(4 \cdot p\right) \cdot p + x \cdot x}}, 0.5, 0.5\right)}} \]
      7. lift-+.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\left(4 \cdot p\right) \cdot p + x \cdot x}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      8. +-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x + \left(4 \cdot p\right) \cdot p}}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      9. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{x \cdot x} + \left(4 \cdot p\right) \cdot p}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      10. lower-fma.f64100.0

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\color{blue}{\mathsf{fma}\left(x, x, \left(4 \cdot p\right) \cdot p\right)}}}, 0.5, 0.5\right)} \]
      11. lift-*.f64N/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{\left(4 \cdot p\right) \cdot p}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      12. *-commutativeN/A

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, \frac{1}{2}, \frac{1}{2}\right)} \]
      13. lower-*.f64100.0

        \[\leadsto \sqrt{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, \color{blue}{p \cdot \left(4 \cdot p\right)}\right)}}, 0.5, 0.5\right)} \]
    4. Applied rewrites100.0%

      \[\leadsto \sqrt{\color{blue}{\mathsf{fma}\left(\frac{x}{\sqrt{\mathsf{fma}\left(x, x, p \cdot \left(4 \cdot p\right)\right)}}, 0.5, 0.5\right)}} \]
    5. Taylor expanded in x around inf

      \[\leadsto \color{blue}{1 + \frac{-1}{2} \cdot \frac{{p}^{2}}{{x}^{2}}} \]
    6. Step-by-step derivation
      1. +-commutativeN/A

        \[\leadsto \color{blue}{\frac{-1}{2} \cdot \frac{{p}^{2}}{{x}^{2}} + 1} \]
      2. lower-fma.f64N/A

        \[\leadsto \color{blue}{\mathsf{fma}\left(\frac{-1}{2}, \frac{{p}^{2}}{{x}^{2}}, 1\right)} \]
      3. lower-/.f64N/A

        \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \color{blue}{\frac{{p}^{2}}{{x}^{2}}}, 1\right) \]
      4. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\color{blue}{p \cdot p}}{{x}^{2}}, 1\right) \]
      5. lower-*.f64N/A

        \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{\color{blue}{p \cdot p}}{{x}^{2}}, 1\right) \]
      6. unpow2N/A

        \[\leadsto \mathsf{fma}\left(\frac{-1}{2}, \frac{p \cdot p}{\color{blue}{x \cdot x}}, 1\right) \]
      7. lower-*.f6498.4

        \[\leadsto \mathsf{fma}\left(-0.5, \frac{p \cdot p}{\color{blue}{x \cdot x}}, 1\right) \]
    7. Applied rewrites98.4%

      \[\leadsto \color{blue}{\mathsf{fma}\left(-0.5, \frac{p \cdot p}{x \cdot x}, 1\right)} \]
  3. Recombined 3 regimes into one program.
  4. Final simplification99.2%

    \[\leadsto \begin{array}{l} \mathbf{if}\;\frac{x}{\sqrt{p \cdot \left(4 \cdot p\right) + x \cdot x}} \leq -0.5:\\ \;\;\;\;\frac{p}{-x}\\ \mathbf{elif}\;\frac{x}{\sqrt{p \cdot \left(4 \cdot p\right) + x \cdot x}} \leq 2 \cdot 10^{-5}:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(0.25, \frac{x}{p}, 0.5\right)}\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(-0.5, \frac{p \cdot p}{x \cdot x}, 1\right)\\ \end{array} \]
  5. Add Preprocessing

Developer Target 1: 79.2% accurate, 0.2× speedup?

\[\begin{array}{l} \\ \sqrt{0.5 + \frac{\mathsf{copysign}\left(0.5, x\right)}{\mathsf{hypot}\left(1, \frac{2 \cdot p}{x}\right)}} \end{array} \]
(FPCore (p x)
 :precision binary64
 (sqrt (+ 0.5 (/ (copysign 0.5 x) (hypot 1.0 (/ (* 2.0 p) x))))))
double code(double p, double x) {
	return sqrt((0.5 + (copysign(0.5, x) / hypot(1.0, ((2.0 * p) / x)))));
}
public static double code(double p, double x) {
	return Math.sqrt((0.5 + (Math.copySign(0.5, x) / Math.hypot(1.0, ((2.0 * p) / x)))));
}
def code(p, x):
	return math.sqrt((0.5 + (math.copysign(0.5, x) / math.hypot(1.0, ((2.0 * p) / x)))))
function code(p, x)
	return sqrt(Float64(0.5 + Float64(copysign(0.5, x) / hypot(1.0, Float64(Float64(2.0 * p) / x)))))
end
function tmp = code(p, x)
	tmp = sqrt((0.5 + ((sign(x) * abs(0.5)) / hypot(1.0, ((2.0 * p) / x)))));
end
code[p_, x_] := N[Sqrt[N[(0.5 + N[(N[With[{TMP1 = Abs[0.5], TMP2 = Sign[x]}, TMP1 * If[TMP2 == 0, 1, TMP2]], $MachinePrecision] / N[Sqrt[1.0 ^ 2 + N[(N[(2.0 * p), $MachinePrecision] / x), $MachinePrecision] ^ 2], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}

\\
\sqrt{0.5 + \frac{\mathsf{copysign}\left(0.5, x\right)}{\mathsf{hypot}\left(1, \frac{2 \cdot p}{x}\right)}}
\end{array}

Reproduce

?
herbie shell --seed 2024228 
(FPCore (p x)
  :name "Given's Rotation SVD example"
  :precision binary64
  :pre (and (< 1e-150 (fabs x)) (< (fabs x) 1e+150))

  :alt
  (! :herbie-platform default (sqrt (+ 1/2 (/ (copysign 1/2 x) (hypot 1 (/ (* 2 p) x))))))

  (sqrt (* 0.5 (+ 1.0 (/ x (sqrt (+ (* (* 4.0 p) p) (* x x))))))))