| Alternative 1 | |
|---|---|
| Accuracy | 100.0% |
| Cost | 14016 |
\[\begin{array}{l}
t_0 := 1 - v \cdot v\\
\sqrt{0.125 \cdot \left(\mathsf{fma}\left(v \cdot v, -3, 1\right) \cdot \left(t_0 \cdot t_0\right)\right)}
\end{array}
\]

(FPCore (v) :precision binary64 (* (* (/ (sqrt 2.0) 4.0) (sqrt (- 1.0 (* 3.0 (* v v))))) (- 1.0 (* v v))))
(FPCore (v) :precision binary64 (let* ((t_0 (- 1.0 (* v v)))) (sqrt (* 0.125 (* (fma (* v v) -3.0 1.0) (* t_0 t_0))))))
double code(double v) {
return ((sqrt(2.0) / 4.0) * sqrt((1.0 - (3.0 * (v * v))))) * (1.0 - (v * v));
}
double code(double v) {
double t_0 = 1.0 - (v * v);
return sqrt((0.125 * (fma((v * v), -3.0, 1.0) * (t_0 * t_0))));
}
function code(v) return Float64(Float64(Float64(sqrt(2.0) / 4.0) * sqrt(Float64(1.0 - Float64(3.0 * Float64(v * v))))) * Float64(1.0 - Float64(v * v))) end
function code(v) t_0 = Float64(1.0 - Float64(v * v)) return sqrt(Float64(0.125 * Float64(fma(Float64(v * v), -3.0, 1.0) * Float64(t_0 * t_0)))) end
code[v_] := N[(N[(N[(N[Sqrt[2.0], $MachinePrecision] / 4.0), $MachinePrecision] * N[Sqrt[N[(1.0 - N[(3.0 * N[(v * v), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] * N[(1.0 - N[(v * v), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
code[v_] := Block[{t$95$0 = N[(1.0 - N[(v * v), $MachinePrecision]), $MachinePrecision]}, N[Sqrt[N[(0.125 * N[(N[(N[(v * v), $MachinePrecision] * -3.0 + 1.0), $MachinePrecision] * N[(t$95$0 * t$95$0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]]
\left(\frac{\sqrt{2}}{4} \cdot \sqrt{1 - 3 \cdot \left(v \cdot v\right)}\right) \cdot \left(1 - v \cdot v\right)
\begin{array}{l}
t_0 := 1 - v \cdot v\\
\sqrt{0.125 \cdot \left(\mathsf{fma}\left(v \cdot v, -3, 1\right) \cdot \left(t_0 \cdot t_0\right)\right)}
\end{array}
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|
Initial program 100.0%
Simplified100.0%
[Start]100.0% | \[ \left(\frac{\sqrt{2}}{4} \cdot \sqrt{1 - 3 \cdot \left(v \cdot v\right)}\right) \cdot \left(1 - v \cdot v\right)
\] |
|---|---|
associate-*l* [=>]100.0% | \[ \color{blue}{\frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)}
\] |
Applied egg-rr100.0%
[Start]100.0% | \[ \frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)
\] |
|---|---|
add-sqr-sqrt [=>]98.5% | \[ \color{blue}{\sqrt{\frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)} \cdot \sqrt{\frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)}}
\] |
sqrt-unprod [=>]100.0% | \[ \color{blue}{\sqrt{\left(\frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right) \cdot \left(\frac{\sqrt{2}}{4} \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}}
\] |
swap-sqr [=>]100.0% | \[ \sqrt{\color{blue}{\left(\frac{\sqrt{2}}{4} \cdot \frac{\sqrt{2}}{4}\right) \cdot \left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right) \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}}
\] |
frac-times [=>]100.0% | \[ \sqrt{\color{blue}{\frac{\sqrt{2} \cdot \sqrt{2}}{4 \cdot 4}} \cdot \left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right) \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}
\] |
add-sqr-sqrt [<=]100.0% | \[ \sqrt{\frac{\color{blue}{2}}{4 \cdot 4} \cdot \left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right) \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}
\] |
metadata-eval [=>]100.0% | \[ \sqrt{\frac{2}{\color{blue}{16}} \cdot \left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right) \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}
\] |
metadata-eval [=>]100.0% | \[ \sqrt{\color{blue}{0.125} \cdot \left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right) \cdot \left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \left(1 - v \cdot v\right)\right)\right)}
\] |
swap-sqr [=>]100.0% | \[ \sqrt{0.125 \cdot \color{blue}{\left(\left(\sqrt{1 - 3 \cdot \left(v \cdot v\right)} \cdot \sqrt{1 - 3 \cdot \left(v \cdot v\right)}\right) \cdot \left(\left(1 - v \cdot v\right) \cdot \left(1 - v \cdot v\right)\right)\right)}}
\] |
Applied egg-rr100.0%
[Start]100.0% | \[ \sqrt{0.125 \cdot \left(\mathsf{fma}\left(v \cdot v, -3, 1\right) \cdot {\left(1 - v \cdot v\right)}^{2}\right)}
\] |
|---|---|
unpow2 [=>]100.0% | \[ \sqrt{0.125 \cdot \left(\mathsf{fma}\left(v \cdot v, -3, 1\right) \cdot \color{blue}{\left(\left(1 - v \cdot v\right) \cdot \left(1 - v \cdot v\right)\right)}\right)}
\] |
Final simplification100.0%
| Alternative 1 | |
|---|---|
| Accuracy | 100.0% |
| Cost | 14016 |
| Alternative 2 | |
|---|---|
| Accuracy | 100.0% |
| Cost | 13632 |
| Alternative 3 | |
|---|---|
| Accuracy | 99.6% |
| Cost | 6976 |
| Alternative 4 | |
|---|---|
| Accuracy | 99.6% |
| Cost | 6976 |
| Alternative 5 | |
|---|---|
| Accuracy | 99.0% |
| Cost | 6464 |
herbie shell --seed 2023272
(FPCore (v)
:name "Falkner and Boettcher, Appendix B, 2"
:precision binary64
(* (* (/ (sqrt 2.0) 4.0) (sqrt (- 1.0 (* 3.0 (* v v))))) (- 1.0 (* v v))))