UniformSampleCone 2

Percentage Accurate: 98.9% → 98.9%
Time: 24.6s
Alternatives: 20
Speedup: N/A×

Specification

?
\[\left(\left(\left(\left(\left(-10000 \leq xi \land xi \leq 10000\right) \land \left(-10000 \leq yi \land yi \leq 10000\right)\right) \land \left(-10000 \leq zi \land zi \leq 10000\right)\right) \land \left(2.328306437 \cdot 10^{-10} \leq ux \land ux \leq 1\right)\right) \land \left(2.328306437 \cdot 10^{-10} \leq uy \land uy \leq 1\right)\right) \land \left(0 \leq maxCos \land maxCos \leq 1\right)\]
\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\\ t_1 := \sqrt{1 - t\_0 \cdot t\_0}\\ t_2 := \left(uy \cdot 2\right) \cdot \pi\\ \left(\left(\cos t\_2 \cdot t\_1\right) \cdot xi + \left(\sin t\_2 \cdot t\_1\right) \cdot yi\right) + t\_0 \cdot zi \end{array} \end{array} \]
(FPCore (xi yi zi ux uy maxCos)
 :precision binary32
 (let* ((t_0 (* (* (- 1.0 ux) maxCos) ux))
        (t_1 (sqrt (- 1.0 (* t_0 t_0))))
        (t_2 (* (* uy 2.0) PI)))
   (+ (+ (* (* (cos t_2) t_1) xi) (* (* (sin t_2) t_1) yi)) (* t_0 zi))))
float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
	float t_0 = ((1.0f - ux) * maxCos) * ux;
	float t_1 = sqrtf((1.0f - (t_0 * t_0)));
	float t_2 = (uy * 2.0f) * ((float) M_PI);
	return (((cosf(t_2) * t_1) * xi) + ((sinf(t_2) * t_1) * yi)) + (t_0 * zi);
}
function code(xi, yi, zi, ux, uy, maxCos)
	t_0 = Float32(Float32(Float32(Float32(1.0) - ux) * maxCos) * ux)
	t_1 = sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))
	t_2 = Float32(Float32(uy * Float32(2.0)) * Float32(pi))
	return Float32(Float32(Float32(Float32(cos(t_2) * t_1) * xi) + Float32(Float32(sin(t_2) * t_1) * yi)) + Float32(t_0 * zi))
end
function tmp = code(xi, yi, zi, ux, uy, maxCos)
	t_0 = ((single(1.0) - ux) * maxCos) * ux;
	t_1 = sqrt((single(1.0) - (t_0 * t_0)));
	t_2 = (uy * single(2.0)) * single(pi);
	tmp = (((cos(t_2) * t_1) * xi) + ((sin(t_2) * t_1) * yi)) + (t_0 * zi);
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\\
t_1 := \sqrt{1 - t\_0 \cdot t\_0}\\
t_2 := \left(uy \cdot 2\right) \cdot \pi\\
\left(\left(\cos t\_2 \cdot t\_1\right) \cdot xi + \left(\sin t\_2 \cdot t\_1\right) \cdot yi\right) + t\_0 \cdot zi
\end{array}
\end{array}

Sampling outcomes in binary32 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 20 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 98.9% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\\ t_1 := \sqrt{1 - t\_0 \cdot t\_0}\\ t_2 := \left(uy \cdot 2\right) \cdot \pi\\ \left(\left(\cos t\_2 \cdot t\_1\right) \cdot xi + \left(\sin t\_2 \cdot t\_1\right) \cdot yi\right) + t\_0 \cdot zi \end{array} \end{array} \]
(FPCore (xi yi zi ux uy maxCos)
 :precision binary32
 (let* ((t_0 (* (* (- 1.0 ux) maxCos) ux))
        (t_1 (sqrt (- 1.0 (* t_0 t_0))))
        (t_2 (* (* uy 2.0) PI)))
   (+ (+ (* (* (cos t_2) t_1) xi) (* (* (sin t_2) t_1) yi)) (* t_0 zi))))
float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
	float t_0 = ((1.0f - ux) * maxCos) * ux;
	float t_1 = sqrtf((1.0f - (t_0 * t_0)));
	float t_2 = (uy * 2.0f) * ((float) M_PI);
	return (((cosf(t_2) * t_1) * xi) + ((sinf(t_2) * t_1) * yi)) + (t_0 * zi);
}
function code(xi, yi, zi, ux, uy, maxCos)
	t_0 = Float32(Float32(Float32(Float32(1.0) - ux) * maxCos) * ux)
	t_1 = sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))
	t_2 = Float32(Float32(uy * Float32(2.0)) * Float32(pi))
	return Float32(Float32(Float32(Float32(cos(t_2) * t_1) * xi) + Float32(Float32(sin(t_2) * t_1) * yi)) + Float32(t_0 * zi))
end
function tmp = code(xi, yi, zi, ux, uy, maxCos)
	t_0 = ((single(1.0) - ux) * maxCos) * ux;
	t_1 = sqrt((single(1.0) - (t_0 * t_0)));
	t_2 = (uy * single(2.0)) * single(pi);
	tmp = (((cos(t_2) * t_1) * xi) + ((sin(t_2) * t_1) * yi)) + (t_0 * zi);
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\\
t_1 := \sqrt{1 - t\_0 \cdot t\_0}\\
t_2 := \left(uy \cdot 2\right) \cdot \pi\\
\left(\left(\cos t\_2 \cdot t\_1\right) \cdot xi + \left(\sin t\_2 \cdot t\_1\right) \cdot yi\right) + t\_0 \cdot zi
\end{array}
\end{array}

Alternative 1: 98.9% accurate, 1.2× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := 2 \cdot \left(uy \cdot \pi\right)\\ \mathsf{fma}\left(\sin t\_0, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \mathsf{fma}\left(maxCos, ux, -maxCos\right), 1\right)}, \cos t\_0 \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \end{array} \end{array} \]
(FPCore (xi yi zi ux uy maxCos)
 :precision binary32
 (let* ((t_0 (* 2.0 (* uy PI))))
   (fma
    (sin t_0)
    yi
    (fma
     (sqrt
      (fma (* ux ux) (* (* maxCos (- 1.0 ux)) (fma maxCos ux (- maxCos))) 1.0))
     (* (cos t_0) xi)
     (* (- 1.0 ux) (* maxCos (* ux zi)))))))
float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
	float t_0 = 2.0f * (uy * ((float) M_PI));
	return fmaf(sinf(t_0), yi, fmaf(sqrtf(fmaf((ux * ux), ((maxCos * (1.0f - ux)) * fmaf(maxCos, ux, -maxCos)), 1.0f)), (cosf(t_0) * xi), ((1.0f - ux) * (maxCos * (ux * zi)))));
}
function code(xi, yi, zi, ux, uy, maxCos)
	t_0 = Float32(Float32(2.0) * Float32(uy * Float32(pi)))
	return fma(sin(t_0), yi, fma(sqrt(fma(Float32(ux * ux), Float32(Float32(maxCos * Float32(Float32(1.0) - ux)) * fma(maxCos, ux, Float32(-maxCos))), Float32(1.0))), Float32(cos(t_0) * xi), Float32(Float32(Float32(1.0) - ux) * Float32(maxCos * Float32(ux * zi)))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := 2 \cdot \left(uy \cdot \pi\right)\\
\mathsf{fma}\left(\sin t\_0, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \mathsf{fma}\left(maxCos, ux, -maxCos\right), 1\right)}, \cos t\_0 \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right)
\end{array}
\end{array}
Derivation
  1. Initial program 98.9%

    \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
  2. Add Preprocessing
  3. Applied rewrites99.0%

    \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)} \cdot \sin \left(2 \cdot \left(uy \cdot \pi\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right)} \]
  4. Taylor expanded in ux around 0

    \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  5. Step-by-step derivation
    1. lower-sin.f32N/A

      \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    2. lower-*.f32N/A

      \[\leadsto \mathsf{fma}\left(\sin \color{blue}{\left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    3. lower-*.f32N/A

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \color{blue}{\left(uy \cdot \mathsf{PI}\left(\right)\right)}\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    4. lower-PI.f3299.0

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \color{blue}{\pi}\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  6. Applied rewrites99.0%

    \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \pi\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  7. Taylor expanded in ux around 0

    \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \color{blue}{\left(maxCos \cdot ux - maxCos\right)}, 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  8. Step-by-step derivation
    1. sub-negN/A

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \color{blue}{\left(maxCos \cdot ux + \left(\mathsf{neg}\left(maxCos\right)\right)\right)}, 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    2. mul-1-negN/A

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(maxCos \cdot ux + \color{blue}{-1 \cdot maxCos}\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    3. lower-fma.f32N/A

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \color{blue}{\mathsf{fma}\left(maxCos, ux, -1 \cdot maxCos\right)}, 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    4. mul-1-negN/A

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \mathsf{fma}\left(maxCos, ux, \color{blue}{\mathsf{neg}\left(maxCos\right)}\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    5. lower-neg.f3299.0

      \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \pi\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \mathsf{fma}\left(maxCos, ux, \color{blue}{-maxCos}\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  9. Applied rewrites99.0%

    \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \pi\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \color{blue}{\mathsf{fma}\left(maxCos, ux, -maxCos\right)}, 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  10. Final simplification99.0%

    \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \pi\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \mathsf{fma}\left(maxCos, ux, -maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
  11. Add Preprocessing

Alternative 2: 94.9% accurate, 1.4× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := 2 \cdot \left(uy \cdot \pi\right)\\ \mathsf{fma}\left(yi, \mathsf{fma}\left(xi, \frac{\cos t\_0}{yi}, \sin t\_0\right), maxCos \cdot \left(ux \cdot zi\right)\right) \end{array} \end{array} \]
(FPCore (xi yi zi ux uy maxCos)
 :precision binary32
 (let* ((t_0 (* 2.0 (* uy PI))))
   (fma yi (fma xi (/ (cos t_0) yi) (sin t_0)) (* maxCos (* ux zi)))))
float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
	float t_0 = 2.0f * (uy * ((float) M_PI));
	return fmaf(yi, fmaf(xi, (cosf(t_0) / yi), sinf(t_0)), (maxCos * (ux * zi)));
}
function code(xi, yi, zi, ux, uy, maxCos)
	t_0 = Float32(Float32(2.0) * Float32(uy * Float32(pi)))
	return fma(yi, fma(xi, Float32(cos(t_0) / yi), sin(t_0)), Float32(maxCos * Float32(ux * zi)))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := 2 \cdot \left(uy \cdot \pi\right)\\
\mathsf{fma}\left(yi, \mathsf{fma}\left(xi, \frac{\cos t\_0}{yi}, \sin t\_0\right), maxCos \cdot \left(ux \cdot zi\right)\right)
\end{array}
\end{array}
Derivation
  1. Initial program 98.9%

    \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
  2. Add Preprocessing
  3. Taylor expanded in yi around inf

    \[\leadsto \color{blue}{yi \cdot \left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + \left(\frac{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}{yi} \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + \frac{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)}{yi}\right)\right)} \]
  4. Applied rewrites98.4%

    \[\leadsto \color{blue}{yi \cdot \mathsf{fma}\left(maxCos, \left(\left(1 - ux\right) \cdot zi\right) \cdot \frac{ux}{yi}, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(\cos \left(\left(2 \cdot uy\right) \cdot \pi\right), \frac{xi}{yi}, \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)\right)} \]
  5. Taylor expanded in ux around 0

    \[\leadsto maxCos \cdot \left(ux \cdot zi\right) + \color{blue}{yi \cdot \left(\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + \frac{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}{yi}\right)} \]
  6. Step-by-step derivation
    1. Applied rewrites95.9%

      \[\leadsto \mathsf{fma}\left(yi, \color{blue}{\mathsf{fma}\left(xi, \frac{\cos \left(2 \cdot \left(uy \cdot \pi\right)\right)}{yi}, \sin \left(2 \cdot \left(uy \cdot \pi\right)\right)\right)}, maxCos \cdot \left(ux \cdot zi\right)\right) \]
    2. Add Preprocessing

    Alternative 3: 97.6% accurate, 1.5× speedup?

    \[\begin{array}{l} \\ \begin{array}{l} t_0 := \pi \cdot \left(2 \cdot uy\right)\\ t_1 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\ \mathbf{if}\;2 \cdot uy \leq 0.02500000037252903:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, t\_1 \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), t\_1 \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, t\_1, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, \cos t\_0, yi \cdot \sin t\_0\right)\\ \end{array} \end{array} \]
    (FPCore (xi yi zi ux uy maxCos)
     :precision binary32
     (let* ((t_0 (* PI (* 2.0 uy)))
            (t_1
             (sqrt
              (fma
               (* maxCos maxCos)
               (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0)))
               1.0))))
       (if (<= (* 2.0 uy) 0.02500000037252903)
         (fma
          uy
          (fma
           uy
           (*
            t_1
            (fma
             -1.3333333333333333
             (* uy (* yi (* PI (* PI PI))))
             (* -2.0 (* xi (* PI PI)))))
           (* t_1 (* 2.0 (* PI yi))))
          (fma xi t_1 (* maxCos (* (- 1.0 ux) (* ux zi)))))
         (fma xi (cos t_0) (* yi (sin t_0))))))
    float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
    	float t_0 = ((float) M_PI) * (2.0f * uy);
    	float t_1 = sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f));
    	float tmp;
    	if ((2.0f * uy) <= 0.02500000037252903f) {
    		tmp = fmaf(uy, fmaf(uy, (t_1 * fmaf(-1.3333333333333333f, (uy * (yi * (((float) M_PI) * (((float) M_PI) * ((float) M_PI))))), (-2.0f * (xi * (((float) M_PI) * ((float) M_PI)))))), (t_1 * (2.0f * (((float) M_PI) * yi)))), fmaf(xi, t_1, (maxCos * ((1.0f - ux) * (ux * zi)))));
    	} else {
    		tmp = fmaf(xi, cosf(t_0), (yi * sinf(t_0)));
    	}
    	return tmp;
    }
    
    function code(xi, yi, zi, ux, uy, maxCos)
    	t_0 = Float32(Float32(pi) * Float32(Float32(2.0) * uy))
    	t_1 = sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0)))
    	tmp = Float32(0.0)
    	if (Float32(Float32(2.0) * uy) <= Float32(0.02500000037252903))
    		tmp = fma(uy, fma(uy, Float32(t_1 * fma(Float32(-1.3333333333333333), Float32(uy * Float32(yi * Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))))), Float32(Float32(-2.0) * Float32(xi * Float32(Float32(pi) * Float32(pi)))))), Float32(t_1 * Float32(Float32(2.0) * Float32(Float32(pi) * yi)))), fma(xi, t_1, Float32(maxCos * Float32(Float32(Float32(1.0) - ux) * Float32(ux * zi)))));
    	else
    		tmp = fma(xi, cos(t_0), Float32(yi * sin(t_0)));
    	end
    	return tmp
    end
    
    \begin{array}{l}
    
    \\
    \begin{array}{l}
    t_0 := \pi \cdot \left(2 \cdot uy\right)\\
    t_1 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\
    \mathbf{if}\;2 \cdot uy \leq 0.02500000037252903:\\
    \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, t\_1 \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), t\_1 \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, t\_1, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\
    
    \mathbf{else}:\\
    \;\;\;\;\mathsf{fma}\left(xi, \cos t\_0, yi \cdot \sin t\_0\right)\\
    
    
    \end{array}
    \end{array}
    
    Derivation
    1. Split input into 2 regimes
    2. if (*.f32 uy #s(literal 2 binary32)) < 0.0250000004

      1. Initial program 99.1%

        \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
      2. Add Preprocessing
      3. Taylor expanded in uy around 0

        \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + \left(uy \cdot \left(2 \cdot \left(\left(yi \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + uy \cdot \left(-2 \cdot \left(\left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \frac{-4}{3} \cdot \left(\left(uy \cdot \left(yi \cdot {\mathsf{PI}\left(\right)}^{3}\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
      4. Applied rewrites99.1%

        \[\leadsto \color{blue}{\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), \left(2 \cdot \left(yi \cdot \pi\right)\right) \cdot \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}\right), \mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)\right)} \]

      if 0.0250000004 < (*.f32 uy #s(literal 2 binary32))

      1. Initial program 97.9%

        \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
      2. Add Preprocessing
      3. Taylor expanded in ux around 0

        \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
      4. Step-by-step derivation
        1. lower-fma.f32N/A

          \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
        2. lower-cos.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
        3. associate-*r*N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
        4. lower-*.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
        5. lower-*.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
        6. lower-PI.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
        7. lower-*.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
        8. lower-sin.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
        9. associate-*r*N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
        10. lower-*.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
        11. lower-*.f32N/A

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
        12. lower-PI.f3290.2

          \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
      5. Applied rewrites90.2%

        \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
    3. Recombined 2 regimes into one program.
    4. Final simplification97.8%

      \[\leadsto \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.02500000037252903:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, \cos \left(\pi \cdot \left(2 \cdot uy\right)\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \end{array} \]
    5. Add Preprocessing

    Alternative 4: 89.2% accurate, 1.6× speedup?

    \[\begin{array}{l} \\ \begin{array}{l} t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\ \mathsf{fma}\left(uy, \mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), t\_0 \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, t\_0, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right) \end{array} \end{array} \]
    (FPCore (xi yi zi ux uy maxCos)
     :precision binary32
     (let* ((t_0
             (sqrt
              (fma
               (* maxCos maxCos)
               (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0)))
               1.0))))
       (fma
        uy
        (fma
         uy
         (*
          t_0
          (fma
           -1.3333333333333333
           (* uy (* yi (* PI (* PI PI))))
           (* -2.0 (* xi (* PI PI)))))
         (* t_0 (* 2.0 (* PI yi))))
        (fma xi t_0 (* maxCos (* (- 1.0 ux) (* ux zi)))))))
    float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
    	float t_0 = sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f));
    	return fmaf(uy, fmaf(uy, (t_0 * fmaf(-1.3333333333333333f, (uy * (yi * (((float) M_PI) * (((float) M_PI) * ((float) M_PI))))), (-2.0f * (xi * (((float) M_PI) * ((float) M_PI)))))), (t_0 * (2.0f * (((float) M_PI) * yi)))), fmaf(xi, t_0, (maxCos * ((1.0f - ux) * (ux * zi)))));
    }
    
    function code(xi, yi, zi, ux, uy, maxCos)
    	t_0 = sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0)))
    	return fma(uy, fma(uy, Float32(t_0 * fma(Float32(-1.3333333333333333), Float32(uy * Float32(yi * Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))))), Float32(Float32(-2.0) * Float32(xi * Float32(Float32(pi) * Float32(pi)))))), Float32(t_0 * Float32(Float32(2.0) * Float32(Float32(pi) * yi)))), fma(xi, t_0, Float32(maxCos * Float32(Float32(Float32(1.0) - ux) * Float32(ux * zi)))))
    end
    
    \begin{array}{l}
    
    \\
    \begin{array}{l}
    t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\
    \mathsf{fma}\left(uy, \mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), t\_0 \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, t\_0, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)
    \end{array}
    \end{array}
    
    Derivation
    1. Initial program 98.9%

      \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
    2. Add Preprocessing
    3. Taylor expanded in uy around 0

      \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + \left(uy \cdot \left(2 \cdot \left(\left(yi \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + uy \cdot \left(-2 \cdot \left(\left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \frac{-4}{3} \cdot \left(\left(uy \cdot \left(yi \cdot {\mathsf{PI}\left(\right)}^{3}\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
    4. Applied rewrites92.2%

      \[\leadsto \color{blue}{\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), \left(2 \cdot \left(yi \cdot \pi\right)\right) \cdot \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}\right), \mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)\right)} \]
    5. Final simplification92.2%

      \[\leadsto \mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(-1.3333333333333333, uy \cdot \left(yi \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \left(2 \cdot \left(\pi \cdot yi\right)\right)\right), \mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    6. Add Preprocessing

    Alternative 5: 90.3% accurate, 1.8× speedup?

    \[\begin{array}{l} \\ \mathsf{fma}\left(\pi \cdot \left(2 \cdot uy\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \left(maxCos \cdot \left(ux + -1\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \end{array} \]
    (FPCore (xi yi zi ux uy maxCos)
     :precision binary32
     (fma
      (* PI (* 2.0 uy))
      yi
      (fma
       (sqrt (fma (* ux ux) (* (* maxCos (- 1.0 ux)) (* maxCos (+ ux -1.0))) 1.0))
       (* (cos (* 2.0 (* uy PI))) xi)
       (* (- 1.0 ux) (* maxCos (* ux zi))))))
    float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
    	return fmaf((((float) M_PI) * (2.0f * uy)), yi, fmaf(sqrtf(fmaf((ux * ux), ((maxCos * (1.0f - ux)) * (maxCos * (ux + -1.0f))), 1.0f)), (cosf((2.0f * (uy * ((float) M_PI)))) * xi), ((1.0f - ux) * (maxCos * (ux * zi)))));
    }
    
    function code(xi, yi, zi, ux, uy, maxCos)
    	return fma(Float32(Float32(pi) * Float32(Float32(2.0) * uy)), yi, fma(sqrt(fma(Float32(ux * ux), Float32(Float32(maxCos * Float32(Float32(1.0) - ux)) * Float32(maxCos * Float32(ux + Float32(-1.0)))), Float32(1.0))), Float32(cos(Float32(Float32(2.0) * Float32(uy * Float32(pi)))) * xi), Float32(Float32(Float32(1.0) - ux) * Float32(maxCos * Float32(ux * zi)))))
    end
    
    \begin{array}{l}
    
    \\
    \mathsf{fma}\left(\pi \cdot \left(2 \cdot uy\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \left(maxCos \cdot \left(ux + -1\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right)
    \end{array}
    
    Derivation
    1. Initial program 98.9%

      \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
    2. Add Preprocessing
    3. Applied rewrites99.0%

      \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)} \cdot \sin \left(2 \cdot \left(uy \cdot \pi\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right)} \]
    4. Taylor expanded in ux around 0

      \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    5. Step-by-step derivation
      1. lower-sin.f32N/A

        \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
      2. lower-*.f32N/A

        \[\leadsto \mathsf{fma}\left(\sin \color{blue}{\left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
      3. lower-*.f32N/A

        \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \color{blue}{\left(uy \cdot \mathsf{PI}\left(\right)\right)}\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
      4. lower-PI.f3299.0

        \[\leadsto \mathsf{fma}\left(\sin \left(2 \cdot \left(uy \cdot \color{blue}{\pi}\right)\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    6. Applied rewrites99.0%

      \[\leadsto \mathsf{fma}\left(\color{blue}{\sin \left(2 \cdot \left(uy \cdot \pi\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    7. Taylor expanded in uy around 0

      \[\leadsto \mathsf{fma}\left(2 \cdot \color{blue}{\left(uy \cdot \mathsf{PI}\left(\right)\right)}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(\mathsf{neg}\left(\left(1 - ux\right) \cdot maxCos\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
    8. Step-by-step derivation
      1. Applied rewrites91.6%

        \[\leadsto \mathsf{fma}\left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}, yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(\left(1 - ux\right) \cdot maxCos\right) \cdot \left(-\left(1 - ux\right) \cdot maxCos\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
      2. Final simplification91.6%

        \[\leadsto \mathsf{fma}\left(\pi \cdot \left(2 \cdot uy\right), yi, \mathsf{fma}\left(\sqrt{\mathsf{fma}\left(ux \cdot ux, \left(maxCos \cdot \left(1 - ux\right)\right) \cdot \left(maxCos \cdot \left(ux + -1\right)\right), 1\right)}, \cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot xi, \left(1 - ux\right) \cdot \left(maxCos \cdot \left(ux \cdot zi\right)\right)\right)\right) \]
      3. Add Preprocessing

      Alternative 6: 88.8% accurate, 2.1× speedup?

      \[\begin{array}{l} \\ \begin{array}{l} t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\ t_1 := ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right)\\ \mathbf{if}\;t\_1 \leq 1.000000045813705 \cdot 10^{-18}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi \cdot t\_0\right) + zi \cdot t\_1\\ \end{array} \end{array} \]
      (FPCore (xi yi zi ux uy maxCos)
       :precision binary32
       (let* ((t_0
               (sqrt
                (fma
                 (* maxCos maxCos)
                 (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0)))
                 1.0)))
              (t_1 (* ux (* maxCos (- 1.0 ux)))))
         (if (<= t_1 1.000000045813705e-18)
           (fma
            xi
            (fma -2.0 (* (* uy PI) (* uy PI)) 1.0)
            (* yi (sin (* PI (* 2.0 uy)))))
           (+
            (fma
             uy
             (* t_0 (fma -2.0 (* uy (* xi (* PI PI))) (* 2.0 (* PI yi))))
             (* xi t_0))
            (* zi t_1)))))
      float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
      	float t_0 = sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f));
      	float t_1 = ux * (maxCos * (1.0f - ux));
      	float tmp;
      	if (t_1 <= 1.000000045813705e-18f) {
      		tmp = fmaf(xi, fmaf(-2.0f, ((uy * ((float) M_PI)) * (uy * ((float) M_PI))), 1.0f), (yi * sinf((((float) M_PI) * (2.0f * uy)))));
      	} else {
      		tmp = fmaf(uy, (t_0 * fmaf(-2.0f, (uy * (xi * (((float) M_PI) * ((float) M_PI)))), (2.0f * (((float) M_PI) * yi)))), (xi * t_0)) + (zi * t_1);
      	}
      	return tmp;
      }
      
      function code(xi, yi, zi, ux, uy, maxCos)
      	t_0 = sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0)))
      	t_1 = Float32(ux * Float32(maxCos * Float32(Float32(1.0) - ux)))
      	tmp = Float32(0.0)
      	if (t_1 <= Float32(1.000000045813705e-18))
      		tmp = fma(xi, fma(Float32(-2.0), Float32(Float32(uy * Float32(pi)) * Float32(uy * Float32(pi))), Float32(1.0)), Float32(yi * sin(Float32(Float32(pi) * Float32(Float32(2.0) * uy)))));
      	else
      		tmp = Float32(fma(uy, Float32(t_0 * fma(Float32(-2.0), Float32(uy * Float32(xi * Float32(Float32(pi) * Float32(pi)))), Float32(Float32(2.0) * Float32(Float32(pi) * yi)))), Float32(xi * t_0)) + Float32(zi * t_1));
      	end
      	return tmp
      end
      
      \begin{array}{l}
      
      \\
      \begin{array}{l}
      t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\
      t_1 := ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right)\\
      \mathbf{if}\;t\_1 \leq 1.000000045813705 \cdot 10^{-18}:\\
      \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\
      
      \mathbf{else}:\\
      \;\;\;\;\mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi \cdot t\_0\right) + zi \cdot t\_1\\
      
      
      \end{array}
      \end{array}
      
      Derivation
      1. Split input into 2 regimes
      2. if (*.f32 (*.f32 (-.f32 #s(literal 1 binary32) ux) maxCos) ux) < 1.00000005e-18

        1. Initial program 98.9%

          \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
        2. Add Preprocessing
        3. Taylor expanded in ux around 0

          \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
        4. Step-by-step derivation
          1. lower-fma.f32N/A

            \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
          2. lower-cos.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
          3. associate-*r*N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
          4. lower-*.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
          5. lower-*.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
          6. lower-PI.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
          7. lower-*.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
          8. lower-sin.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
          9. associate-*r*N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
          10. lower-*.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
          11. lower-*.f32N/A

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
          12. lower-PI.f3297.0

            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
        5. Applied rewrites97.0%

          \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
        6. Taylor expanded in uy around 0

          \[\leadsto \mathsf{fma}\left(xi, 1 + \color{blue}{-2 \cdot \left({uy}^{2} \cdot {\mathsf{PI}\left(\right)}^{2}\right)}, yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)\right) \]
        7. Step-by-step derivation
          1. Applied rewrites94.2%

            \[\leadsto \mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \color{blue}{\left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right)}, 1\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right) \]

          if 1.00000005e-18 < (*.f32 (*.f32 (-.f32 #s(literal 1 binary32) ux) maxCos) ux)

          1. Initial program 98.9%

            \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
          2. Add Preprocessing
          3. Taylor expanded in uy around 0

            \[\leadsto \color{blue}{\left(uy \cdot \left(-2 \cdot \left(\left(uy \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + 2 \cdot \left(\left(yi \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
          4. Step-by-step derivation
            1. lower-fma.f32N/A

              \[\leadsto \color{blue}{\mathsf{fma}\left(uy, -2 \cdot \left(\left(uy \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + 2 \cdot \left(\left(yi \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right), xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
          5. Applied rewrites91.1%

            \[\leadsto \color{blue}{\mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(yi \cdot \pi\right)\right), xi \cdot \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
        8. Recombined 2 regimes into one program.
        9. Final simplification93.1%

          \[\leadsto \begin{array}{l} \mathbf{if}\;ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right) \leq 1.000000045813705 \cdot 10^{-18}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi \cdot \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\right) + zi \cdot \left(ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right)\right)\\ \end{array} \]
        10. Add Preprocessing

        Alternative 7: 88.9% accurate, 2.1× speedup?

        \[\begin{array}{l} \\ \begin{array}{l} t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\ \mathbf{if}\;ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right) \leq 1.000000045813705 \cdot 10^{-18}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, t\_0, \mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\ \end{array} \end{array} \]
        (FPCore (xi yi zi ux uy maxCos)
         :precision binary32
         (let* ((t_0
                 (sqrt
                  (fma
                   (* maxCos maxCos)
                   (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0)))
                   1.0))))
           (if (<= (* ux (* maxCos (- 1.0 ux))) 1.000000045813705e-18)
             (fma
              xi
              (fma -2.0 (* (* uy PI) (* uy PI)) 1.0)
              (* yi (sin (* PI (* 2.0 uy)))))
             (fma
              xi
              t_0
              (fma
               uy
               (* t_0 (fma -2.0 (* uy (* xi (* PI PI))) (* 2.0 (* PI yi))))
               (* maxCos (* (- 1.0 ux) (* ux zi))))))))
        float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
        	float t_0 = sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f));
        	float tmp;
        	if ((ux * (maxCos * (1.0f - ux))) <= 1.000000045813705e-18f) {
        		tmp = fmaf(xi, fmaf(-2.0f, ((uy * ((float) M_PI)) * (uy * ((float) M_PI))), 1.0f), (yi * sinf((((float) M_PI) * (2.0f * uy)))));
        	} else {
        		tmp = fmaf(xi, t_0, fmaf(uy, (t_0 * fmaf(-2.0f, (uy * (xi * (((float) M_PI) * ((float) M_PI)))), (2.0f * (((float) M_PI) * yi)))), (maxCos * ((1.0f - ux) * (ux * zi)))));
        	}
        	return tmp;
        }
        
        function code(xi, yi, zi, ux, uy, maxCos)
        	t_0 = sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0)))
        	tmp = Float32(0.0)
        	if (Float32(ux * Float32(maxCos * Float32(Float32(1.0) - ux))) <= Float32(1.000000045813705e-18))
        		tmp = fma(xi, fma(Float32(-2.0), Float32(Float32(uy * Float32(pi)) * Float32(uy * Float32(pi))), Float32(1.0)), Float32(yi * sin(Float32(Float32(pi) * Float32(Float32(2.0) * uy)))));
        	else
        		tmp = fma(xi, t_0, fma(uy, Float32(t_0 * fma(Float32(-2.0), Float32(uy * Float32(xi * Float32(Float32(pi) * Float32(pi)))), Float32(Float32(2.0) * Float32(Float32(pi) * yi)))), Float32(maxCos * Float32(Float32(Float32(1.0) - ux) * Float32(ux * zi)))));
        	end
        	return tmp
        end
        
        \begin{array}{l}
        
        \\
        \begin{array}{l}
        t_0 := \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}\\
        \mathbf{if}\;ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right) \leq 1.000000045813705 \cdot 10^{-18}:\\
        \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\
        
        \mathbf{else}:\\
        \;\;\;\;\mathsf{fma}\left(xi, t\_0, \mathsf{fma}\left(uy, t\_0 \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\
        
        
        \end{array}
        \end{array}
        
        Derivation
        1. Split input into 2 regimes
        2. if (*.f32 (*.f32 (-.f32 #s(literal 1 binary32) ux) maxCos) ux) < 1.00000005e-18

          1. Initial program 98.9%

            \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
          2. Add Preprocessing
          3. Taylor expanded in ux around 0

            \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
          4. Step-by-step derivation
            1. lower-fma.f32N/A

              \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
            2. lower-cos.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
            3. associate-*r*N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
            4. lower-*.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
            5. lower-*.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
            6. lower-PI.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
            7. lower-*.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
            8. lower-sin.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
            9. associate-*r*N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
            10. lower-*.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
            11. lower-*.f32N/A

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
            12. lower-PI.f3297.0

              \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
          5. Applied rewrites97.0%

            \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
          6. Taylor expanded in uy around 0

            \[\leadsto \mathsf{fma}\left(xi, 1 + \color{blue}{-2 \cdot \left({uy}^{2} \cdot {\mathsf{PI}\left(\right)}^{2}\right)}, yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)\right) \]
          7. Step-by-step derivation
            1. Applied rewrites94.2%

              \[\leadsto \mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \color{blue}{\left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right)}, 1\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right) \]

            if 1.00000005e-18 < (*.f32 (*.f32 (-.f32 #s(literal 1 binary32) ux) maxCos) ux)

            1. Initial program 98.9%

              \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
            2. Add Preprocessing
            3. Taylor expanded in uy around 0

              \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + \left(uy \cdot \left(-2 \cdot \left(\left(uy \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + 2 \cdot \left(\left(yi \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
            4. Applied rewrites91.0%

              \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(yi \cdot \pi\right)\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)\right)} \]
          8. Recombined 2 regimes into one program.
          9. Final simplification93.1%

            \[\leadsto \begin{array}{l} \mathbf{if}\;ux \cdot \left(maxCos \cdot \left(1 - ux\right)\right) \leq 1.000000045813705 \cdot 10^{-18}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, \mathsf{fma}\left(uy, \sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\right)\\ \end{array} \]
          10. Add Preprocessing

          Alternative 8: 90.1% accurate, 2.3× speedup?

          \[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \end{array} \end{array} \]
          (FPCore (xi yi zi ux uy maxCos)
           :precision binary32
           (if (<= (* 2.0 uy) 0.00044999999227002263)
             (-
              (*
               (sqrt
                (fma (* maxCos maxCos) (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0))) 1.0))
               (fma 2.0 (* uy (* PI yi)) xi))
              (* zi (* ux (* maxCos (+ ux -1.0)))))
             (fma
              xi
              (fma -2.0 (* (* uy PI) (* uy PI)) 1.0)
              (* yi (sin (* PI (* 2.0 uy)))))))
          float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
          	float tmp;
          	if ((2.0f * uy) <= 0.00044999999227002263f) {
          		tmp = (sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f)) * fmaf(2.0f, (uy * (((float) M_PI) * yi)), xi)) - (zi * (ux * (maxCos * (ux + -1.0f))));
          	} else {
          		tmp = fmaf(xi, fmaf(-2.0f, ((uy * ((float) M_PI)) * (uy * ((float) M_PI))), 1.0f), (yi * sinf((((float) M_PI) * (2.0f * uy)))));
          	}
          	return tmp;
          }
          
          function code(xi, yi, zi, ux, uy, maxCos)
          	tmp = Float32(0.0)
          	if (Float32(Float32(2.0) * uy) <= Float32(0.00044999999227002263))
          		tmp = Float32(Float32(sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0))) * fma(Float32(2.0), Float32(uy * Float32(Float32(pi) * yi)), xi)) - Float32(zi * Float32(ux * Float32(maxCos * Float32(ux + Float32(-1.0))))));
          	else
          		tmp = fma(xi, fma(Float32(-2.0), Float32(Float32(uy * Float32(pi)) * Float32(uy * Float32(pi))), Float32(1.0)), Float32(yi * sin(Float32(Float32(pi) * Float32(Float32(2.0) * uy)))));
          	end
          	return tmp
          end
          
          \begin{array}{l}
          
          \\
          \begin{array}{l}
          \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\
          \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\
          
          \mathbf{else}:\\
          \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\
          
          
          \end{array}
          \end{array}
          
          Derivation
          1. Split input into 2 regimes
          2. if (*.f32 uy #s(literal 2 binary32)) < 4.49999992e-4

            1. Initial program 99.2%

              \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
            2. Add Preprocessing
            3. Taylor expanded in uy around 0

              \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
            4. Step-by-step derivation
              1. associate-*r*N/A

                \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              2. distribute-rgt-outN/A

                \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              3. lower-*.f32N/A

                \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
            5. Applied rewrites99.0%

              \[\leadsto \color{blue}{\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]

            if 4.49999992e-4 < (*.f32 uy #s(literal 2 binary32))

            1. Initial program 98.5%

              \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
            2. Add Preprocessing
            3. Taylor expanded in ux around 0

              \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
            4. Step-by-step derivation
              1. lower-fma.f32N/A

                \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
              2. lower-cos.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
              3. associate-*r*N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
              4. lower-*.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
              5. lower-*.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
              6. lower-PI.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
              7. lower-*.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
              8. lower-sin.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
              9. associate-*r*N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
              10. lower-*.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
              11. lower-*.f32N/A

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
              12. lower-PI.f3289.5

                \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
            5. Applied rewrites89.5%

              \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
            6. Taylor expanded in uy around 0

              \[\leadsto \mathsf{fma}\left(xi, 1 + \color{blue}{-2 \cdot \left({uy}^{2} \cdot {\mathsf{PI}\left(\right)}^{2}\right)}, yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)\right) \]
            7. Step-by-step derivation
              1. Applied rewrites81.0%

                \[\leadsto \mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \color{blue}{\left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right)}, 1\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right) \]
            8. Recombined 2 regimes into one program.
            9. Final simplification92.1%

              \[\leadsto \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(xi, \mathsf{fma}\left(-2, \left(uy \cdot \pi\right) \cdot \left(uy \cdot \pi\right), 1\right), yi \cdot \sin \left(\pi \cdot \left(2 \cdot uy\right)\right)\right)\\ \end{array} \]
            10. Add Preprocessing

            Alternative 9: 86.6% accurate, 3.7× speedup?

            \[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \end{array} \]
            (FPCore (xi yi zi ux uy maxCos)
             :precision binary32
             (if (<= (* 2.0 uy) 0.00044999999227002263)
               (-
                (*
                 (sqrt
                  (fma (* maxCos maxCos) (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0))) 1.0))
                 (fma 2.0 (* uy (* PI yi)) xi))
                (* zi (* ux (* maxCos (+ ux -1.0)))))
               (fma
                uy
                (fma
                 uy
                 (fma
                  -1.3333333333333333
                  (* (* PI (* PI PI)) (* uy yi))
                  (* -2.0 (* xi (* PI PI))))
                 (* 2.0 (* PI yi)))
                xi)))
            float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
            	float tmp;
            	if ((2.0f * uy) <= 0.00044999999227002263f) {
            		tmp = (sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f)) * fmaf(2.0f, (uy * (((float) M_PI) * yi)), xi)) - (zi * (ux * (maxCos * (ux + -1.0f))));
            	} else {
            		tmp = fmaf(uy, fmaf(uy, fmaf(-1.3333333333333333f, ((((float) M_PI) * (((float) M_PI) * ((float) M_PI))) * (uy * yi)), (-2.0f * (xi * (((float) M_PI) * ((float) M_PI))))), (2.0f * (((float) M_PI) * yi))), xi);
            	}
            	return tmp;
            }
            
            function code(xi, yi, zi, ux, uy, maxCos)
            	tmp = Float32(0.0)
            	if (Float32(Float32(2.0) * uy) <= Float32(0.00044999999227002263))
            		tmp = Float32(Float32(sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0))) * fma(Float32(2.0), Float32(uy * Float32(Float32(pi) * yi)), xi)) - Float32(zi * Float32(ux * Float32(maxCos * Float32(ux + Float32(-1.0))))));
            	else
            		tmp = fma(uy, fma(uy, fma(Float32(-1.3333333333333333), Float32(Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))) * Float32(uy * yi)), Float32(Float32(-2.0) * Float32(xi * Float32(Float32(pi) * Float32(pi))))), Float32(Float32(2.0) * Float32(Float32(pi) * yi))), xi);
            	end
            	return tmp
            end
            
            \begin{array}{l}
            
            \\
            \begin{array}{l}
            \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\
            \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\
            
            \mathbf{else}:\\
            \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\
            
            
            \end{array}
            \end{array}
            
            Derivation
            1. Split input into 2 regimes
            2. if (*.f32 uy #s(literal 2 binary32)) < 4.49999992e-4

              1. Initial program 99.2%

                \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              2. Add Preprocessing
              3. Taylor expanded in uy around 0

                \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              4. Step-by-step derivation
                1. associate-*r*N/A

                  \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                2. distribute-rgt-outN/A

                  \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                3. lower-*.f32N/A

                  \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              5. Applied rewrites99.0%

                \[\leadsto \color{blue}{\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right)} + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]

              if 4.49999992e-4 < (*.f32 uy #s(literal 2 binary32))

              1. Initial program 98.5%

                \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
              2. Add Preprocessing
              3. Taylor expanded in ux around 0

                \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
              4. Step-by-step derivation
                1. lower-fma.f32N/A

                  \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
                2. lower-cos.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                3. associate-*r*N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                4. lower-*.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                5. lower-*.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                6. lower-PI.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                7. lower-*.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                8. lower-sin.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                9. associate-*r*N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                10. lower-*.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                11. lower-*.f32N/A

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
                12. lower-PI.f3289.5

                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
              5. Applied rewrites89.5%

                \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
              6. Taylor expanded in uy around 0

                \[\leadsto xi + \color{blue}{uy \cdot \left(2 \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right) + uy \cdot \left(-2 \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right) + \frac{-4}{3} \cdot \left(uy \cdot \left(yi \cdot {\mathsf{PI}\left(\right)}^{3}\right)\right)\right)\right)} \]
              7. Step-by-step derivation
                1. Applied rewrites72.7%

                  \[\leadsto \mathsf{fma}\left(uy, \color{blue}{\mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(uy \cdot yi\right) \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right)}, xi\right) \]
              8. Recombined 2 regimes into one program.
              9. Final simplification88.9%

                \[\leadsto \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)} \cdot \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) - zi \cdot \left(ux \cdot \left(maxCos \cdot \left(ux + -1\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \]
              10. Add Preprocessing

              Alternative 10: 86.6% accurate, 3.8× speedup?

              \[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \end{array} \]
              (FPCore (xi yi zi ux uy maxCos)
               :precision binary32
               (if (<= (* 2.0 uy) 0.00044999999227002263)
                 (fma
                  (sqrt (fma (* maxCos maxCos) (* (* ux ux) (* (- 1.0 ux) (+ ux -1.0))) 1.0))
                  (fma 2.0 (* uy (* PI yi)) xi)
                  (* maxCos (* (- 1.0 ux) (* ux zi))))
                 (fma
                  uy
                  (fma
                   uy
                   (fma
                    -1.3333333333333333
                    (* (* PI (* PI PI)) (* uy yi))
                    (* -2.0 (* xi (* PI PI))))
                   (* 2.0 (* PI yi)))
                  xi)))
              float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
              	float tmp;
              	if ((2.0f * uy) <= 0.00044999999227002263f) {
              		tmp = fmaf(sqrtf(fmaf((maxCos * maxCos), ((ux * ux) * ((1.0f - ux) * (ux + -1.0f))), 1.0f)), fmaf(2.0f, (uy * (((float) M_PI) * yi)), xi), (maxCos * ((1.0f - ux) * (ux * zi))));
              	} else {
              		tmp = fmaf(uy, fmaf(uy, fmaf(-1.3333333333333333f, ((((float) M_PI) * (((float) M_PI) * ((float) M_PI))) * (uy * yi)), (-2.0f * (xi * (((float) M_PI) * ((float) M_PI))))), (2.0f * (((float) M_PI) * yi))), xi);
              	}
              	return tmp;
              }
              
              function code(xi, yi, zi, ux, uy, maxCos)
              	tmp = Float32(0.0)
              	if (Float32(Float32(2.0) * uy) <= Float32(0.00044999999227002263))
              		tmp = fma(sqrt(fma(Float32(maxCos * maxCos), Float32(Float32(ux * ux) * Float32(Float32(Float32(1.0) - ux) * Float32(ux + Float32(-1.0)))), Float32(1.0))), fma(Float32(2.0), Float32(uy * Float32(Float32(pi) * yi)), xi), Float32(maxCos * Float32(Float32(Float32(1.0) - ux) * Float32(ux * zi))));
              	else
              		tmp = fma(uy, fma(uy, fma(Float32(-1.3333333333333333), Float32(Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))) * Float32(uy * yi)), Float32(Float32(-2.0) * Float32(xi * Float32(Float32(pi) * Float32(pi))))), Float32(Float32(2.0) * Float32(Float32(pi) * yi))), xi);
              	end
              	return tmp
              end
              
              \begin{array}{l}
              
              \\
              \begin{array}{l}
              \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\
              \;\;\;\;\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\\
              
              \mathbf{else}:\\
              \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\
              
              
              \end{array}
              \end{array}
              
              Derivation
              1. Split input into 2 regimes
              2. if (*.f32 uy #s(literal 2 binary32)) < 4.49999992e-4

                1. Initial program 99.2%

                  \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                2. Add Preprocessing
                3. Taylor expanded in uy around 0

                  \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                4. Step-by-step derivation
                  1. +-commutativeN/A

                    \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                  2. associate-+r+N/A

                    \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                  3. associate-*r*N/A

                    \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                  4. distribute-rgt-outN/A

                    \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                5. Applied rewrites99.0%

                  \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]

                if 4.49999992e-4 < (*.f32 uy #s(literal 2 binary32))

                1. Initial program 98.5%

                  \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                2. Add Preprocessing
                3. Taylor expanded in ux around 0

                  \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                4. Step-by-step derivation
                  1. lower-fma.f32N/A

                    \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
                  2. lower-cos.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                  3. associate-*r*N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                  4. lower-*.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                  5. lower-*.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                  6. lower-PI.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                  7. lower-*.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                  8. lower-sin.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                  9. associate-*r*N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                  10. lower-*.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                  11. lower-*.f32N/A

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
                  12. lower-PI.f3289.5

                    \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
                5. Applied rewrites89.5%

                  \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
                6. Taylor expanded in uy around 0

                  \[\leadsto xi + \color{blue}{uy \cdot \left(2 \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right) + uy \cdot \left(-2 \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right) + \frac{-4}{3} \cdot \left(uy \cdot \left(yi \cdot {\mathsf{PI}\left(\right)}^{3}\right)\right)\right)\right)} \]
                7. Step-by-step derivation
                  1. Applied rewrites72.7%

                    \[\leadsto \mathsf{fma}\left(uy, \color{blue}{\mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(uy \cdot yi\right) \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right)}, xi\right) \]
                8. Recombined 2 regimes into one program.
                9. Final simplification88.9%

                  \[\leadsto \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(ux \cdot ux\right) \cdot \left(\left(1 - ux\right) \cdot \left(ux + -1\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \]
                10. Add Preprocessing

                Alternative 11: 86.5% accurate, 4.7× speedup?

                \[\begin{array}{l} \\ \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \end{array} \]
                (FPCore (xi yi zi ux uy maxCos)
                 :precision binary32
                 (if (<= (* 2.0 uy) 0.00044999999227002263)
                   (+ xi (fma (* ux maxCos) (* (- 1.0 ux) zi) (* (* PI yi) (* 2.0 uy))))
                   (fma
                    uy
                    (fma
                     uy
                     (fma
                      -1.3333333333333333
                      (* (* PI (* PI PI)) (* uy yi))
                      (* -2.0 (* xi (* PI PI))))
                     (* 2.0 (* PI yi)))
                    xi)))
                float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                	float tmp;
                	if ((2.0f * uy) <= 0.00044999999227002263f) {
                		tmp = xi + fmaf((ux * maxCos), ((1.0f - ux) * zi), ((((float) M_PI) * yi) * (2.0f * uy)));
                	} else {
                		tmp = fmaf(uy, fmaf(uy, fmaf(-1.3333333333333333f, ((((float) M_PI) * (((float) M_PI) * ((float) M_PI))) * (uy * yi)), (-2.0f * (xi * (((float) M_PI) * ((float) M_PI))))), (2.0f * (((float) M_PI) * yi))), xi);
                	}
                	return tmp;
                }
                
                function code(xi, yi, zi, ux, uy, maxCos)
                	tmp = Float32(0.0)
                	if (Float32(Float32(2.0) * uy) <= Float32(0.00044999999227002263))
                		tmp = Float32(xi + fma(Float32(ux * maxCos), Float32(Float32(Float32(1.0) - ux) * zi), Float32(Float32(Float32(pi) * yi) * Float32(Float32(2.0) * uy))));
                	else
                		tmp = fma(uy, fma(uy, fma(Float32(-1.3333333333333333), Float32(Float32(Float32(pi) * Float32(Float32(pi) * Float32(pi))) * Float32(uy * yi)), Float32(Float32(-2.0) * Float32(xi * Float32(Float32(pi) * Float32(pi))))), Float32(Float32(2.0) * Float32(Float32(pi) * yi))), xi);
                	end
                	return tmp
                end
                
                \begin{array}{l}
                
                \\
                \begin{array}{l}
                \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\
                \;\;\;\;xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right)\\
                
                \mathbf{else}:\\
                \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\
                
                
                \end{array}
                \end{array}
                
                Derivation
                1. Split input into 2 regimes
                2. if (*.f32 uy #s(literal 2 binary32)) < 4.49999992e-4

                  1. Initial program 99.2%

                    \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                  2. Add Preprocessing
                  3. Taylor expanded in uy around 0

                    \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                  4. Step-by-step derivation
                    1. +-commutativeN/A

                      \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                    2. associate-+r+N/A

                      \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                    3. associate-*r*N/A

                      \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                    4. distribute-rgt-outN/A

                      \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                  5. Applied rewrites99.0%

                    \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]
                  6. Taylor expanded in maxCos around 0

                    \[\leadsto xi + \color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                  7. Step-by-step derivation
                    1. Applied rewrites98.7%

                      \[\leadsto xi + \color{blue}{\mathsf{fma}\left(maxCos \cdot ux, zi \cdot \left(1 - ux\right), \left(2 \cdot uy\right) \cdot \left(yi \cdot \pi\right)\right)} \]

                    if 4.49999992e-4 < (*.f32 uy #s(literal 2 binary32))

                    1. Initial program 98.5%

                      \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                    2. Add Preprocessing
                    3. Taylor expanded in ux around 0

                      \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                    4. Step-by-step derivation
                      1. lower-fma.f32N/A

                        \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
                      2. lower-cos.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                      3. associate-*r*N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                      4. lower-*.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                      5. lower-*.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                      6. lower-PI.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                      7. lower-*.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                      8. lower-sin.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                      9. associate-*r*N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                      10. lower-*.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                      11. lower-*.f32N/A

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
                      12. lower-PI.f3289.5

                        \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
                    5. Applied rewrites89.5%

                      \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
                    6. Taylor expanded in uy around 0

                      \[\leadsto xi + \color{blue}{uy \cdot \left(2 \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right) + uy \cdot \left(-2 \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right) + \frac{-4}{3} \cdot \left(uy \cdot \left(yi \cdot {\mathsf{PI}\left(\right)}^{3}\right)\right)\right)\right)} \]
                    7. Step-by-step derivation
                      1. Applied rewrites72.7%

                        \[\leadsto \mathsf{fma}\left(uy, \color{blue}{\mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(uy \cdot yi\right) \cdot \left(\pi \cdot \left(\pi \cdot \pi\right)\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right)}, xi\right) \]
                    8. Recombined 2 regimes into one program.
                    9. Final simplification88.8%

                      \[\leadsto \begin{array}{l} \mathbf{if}\;2 \cdot uy \leq 0.00044999999227002263:\\ \;\;\;\;xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(uy, \mathsf{fma}\left(uy, \mathsf{fma}\left(-1.3333333333333333, \left(\pi \cdot \left(\pi \cdot \pi\right)\right) \cdot \left(uy \cdot yi\right), -2 \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)\\ \end{array} \]
                    10. Add Preprocessing

                    Alternative 12: 81.5% accurate, 8.6× speedup?

                    \[\begin{array}{l} \\ \mathsf{fma}\left(1, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right) \end{array} \]
                    (FPCore (xi yi zi ux uy maxCos)
                     :precision binary32
                     (fma 1.0 (fma 2.0 (* uy (* PI yi)) xi) (* maxCos (* (- 1.0 ux) (* ux zi)))))
                    float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                    	return fmaf(1.0f, fmaf(2.0f, (uy * (((float) M_PI) * yi)), xi), (maxCos * ((1.0f - ux) * (ux * zi))));
                    }
                    
                    function code(xi, yi, zi, ux, uy, maxCos)
                    	return fma(Float32(1.0), fma(Float32(2.0), Float32(uy * Float32(Float32(pi) * yi)), xi), Float32(maxCos * Float32(Float32(Float32(1.0) - ux) * Float32(ux * zi))))
                    end
                    
                    \begin{array}{l}
                    
                    \\
                    \mathsf{fma}\left(1, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right)
                    \end{array}
                    
                    Derivation
                    1. Initial program 98.9%

                      \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                    2. Add Preprocessing
                    3. Taylor expanded in uy around 0

                      \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                    4. Step-by-step derivation
                      1. +-commutativeN/A

                        \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                      2. associate-+r+N/A

                        \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                      3. associate-*r*N/A

                        \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                      4. distribute-rgt-outN/A

                        \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                    5. Applied rewrites84.3%

                      \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]
                    6. Taylor expanded in maxCos around 0

                      \[\leadsto \mathsf{fma}\left(1, \mathsf{fma}\left(\color{blue}{2}, uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right) \]
                    7. Step-by-step derivation
                      1. Applied rewrites84.1%

                        \[\leadsto \mathsf{fma}\left(1, \mathsf{fma}\left(\color{blue}{2}, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right) \]
                      2. Final simplification84.1%

                        \[\leadsto \mathsf{fma}\left(1, \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right), maxCos \cdot \left(\left(1 - ux\right) \cdot \left(ux \cdot zi\right)\right)\right) \]
                      3. Add Preprocessing

                      Alternative 13: 81.5% accurate, 9.3× speedup?

                      \[\begin{array}{l} \\ xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right) \end{array} \]
                      (FPCore (xi yi zi ux uy maxCos)
                       :precision binary32
                       (+ xi (fma (* ux maxCos) (* (- 1.0 ux) zi) (* (* PI yi) (* 2.0 uy)))))
                      float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                      	return xi + fmaf((ux * maxCos), ((1.0f - ux) * zi), ((((float) M_PI) * yi) * (2.0f * uy)));
                      }
                      
                      function code(xi, yi, zi, ux, uy, maxCos)
                      	return Float32(xi + fma(Float32(ux * maxCos), Float32(Float32(Float32(1.0) - ux) * zi), Float32(Float32(Float32(pi) * yi) * Float32(Float32(2.0) * uy))))
                      end
                      
                      \begin{array}{l}
                      
                      \\
                      xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right)
                      \end{array}
                      
                      Derivation
                      1. Initial program 98.9%

                        \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                      2. Add Preprocessing
                      3. Taylor expanded in uy around 0

                        \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                      4. Step-by-step derivation
                        1. +-commutativeN/A

                          \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                        2. associate-+r+N/A

                          \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                        3. associate-*r*N/A

                          \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                        4. distribute-rgt-outN/A

                          \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                      5. Applied rewrites84.3%

                        \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]
                      6. Taylor expanded in maxCos around 0

                        \[\leadsto xi + \color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                      7. Step-by-step derivation
                        1. Applied rewrites84.1%

                          \[\leadsto xi + \color{blue}{\mathsf{fma}\left(maxCos \cdot ux, zi \cdot \left(1 - ux\right), \left(2 \cdot uy\right) \cdot \left(yi \cdot \pi\right)\right)} \]
                        2. Final simplification84.1%

                          \[\leadsto xi + \mathsf{fma}\left(ux \cdot maxCos, \left(1 - ux\right) \cdot zi, \left(\pi \cdot yi\right) \cdot \left(2 \cdot uy\right)\right) \]
                        3. Add Preprocessing

                        Alternative 14: 78.0% accurate, 9.3× speedup?

                        \[\begin{array}{l} \\ \mathsf{fma}\left(uy, \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right) \end{array} \]
                        (FPCore (xi yi zi ux uy maxCos)
                         :precision binary32
                         (fma uy (fma -2.0 (* uy (* xi (* PI PI))) (* 2.0 (* PI yi))) xi))
                        float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                        	return fmaf(uy, fmaf(-2.0f, (uy * (xi * (((float) M_PI) * ((float) M_PI)))), (2.0f * (((float) M_PI) * yi))), xi);
                        }
                        
                        function code(xi, yi, zi, ux, uy, maxCos)
                        	return fma(uy, fma(Float32(-2.0), Float32(uy * Float32(xi * Float32(Float32(pi) * Float32(pi)))), Float32(Float32(2.0) * Float32(Float32(pi) * yi))), xi)
                        end
                        
                        \begin{array}{l}
                        
                        \\
                        \mathsf{fma}\left(uy, \mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right), xi\right)
                        \end{array}
                        
                        Derivation
                        1. Initial program 98.9%

                          \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                        2. Add Preprocessing
                        3. Taylor expanded in ux around 0

                          \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                        4. Step-by-step derivation
                          1. lower-fma.f32N/A

                            \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
                          2. lower-cos.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                          3. associate-*r*N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                          4. lower-*.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                          5. lower-*.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                          6. lower-PI.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                          7. lower-*.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                          8. lower-sin.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                          9. associate-*r*N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                          10. lower-*.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                          11. lower-*.f32N/A

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
                          12. lower-PI.f3291.6

                            \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
                        5. Applied rewrites91.6%

                          \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
                        6. Taylor expanded in uy around 0

                          \[\leadsto xi + \color{blue}{uy \cdot \left(-2 \cdot \left(uy \cdot \left(xi \cdot {\mathsf{PI}\left(\right)}^{2}\right)\right) + 2 \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                        7. Step-by-step derivation
                          1. Applied rewrites82.1%

                            \[\leadsto \mathsf{fma}\left(uy, \color{blue}{\mathsf{fma}\left(-2, uy \cdot \left(xi \cdot \left(\pi \cdot \pi\right)\right), 2 \cdot \left(\pi \cdot yi\right)\right)}, xi\right) \]
                          2. Add Preprocessing

                          Alternative 15: 78.8% accurate, 11.8× speedup?

                          \[\begin{array}{l} \\ maxCos \cdot \left(ux \cdot zi\right) + \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right) \end{array} \]
                          (FPCore (xi yi zi ux uy maxCos)
                           :precision binary32
                           (+ (* maxCos (* ux zi)) (fma (* 2.0 uy) (* PI yi) xi)))
                          float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                          	return (maxCos * (ux * zi)) + fmaf((2.0f * uy), (((float) M_PI) * yi), xi);
                          }
                          
                          function code(xi, yi, zi, ux, uy, maxCos)
                          	return Float32(Float32(maxCos * Float32(ux * zi)) + fma(Float32(Float32(2.0) * uy), Float32(Float32(pi) * yi), xi))
                          end
                          
                          \begin{array}{l}
                          
                          \\
                          maxCos \cdot \left(ux \cdot zi\right) + \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right)
                          \end{array}
                          
                          Derivation
                          1. Initial program 98.9%

                            \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                          2. Add Preprocessing
                          3. Taylor expanded in uy around 0

                            \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                          4. Step-by-step derivation
                            1. +-commutativeN/A

                              \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                            2. associate-+r+N/A

                              \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                            3. associate-*r*N/A

                              \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                            4. distribute-rgt-outN/A

                              \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                          5. Applied rewrites84.3%

                            \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]
                          6. Taylor expanded in ux around 0

                            \[\leadsto xi + \color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + maxCos \cdot \left(ux \cdot zi\right)\right)} \]
                          7. Step-by-step derivation
                            1. Applied rewrites82.0%

                              \[\leadsto \mathsf{fma}\left(2 \cdot uy, yi \cdot \pi, xi\right) + \color{blue}{maxCos \cdot \left(ux \cdot zi\right)} \]
                            2. Final simplification82.0%

                              \[\leadsto maxCos \cdot \left(ux \cdot zi\right) + \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right) \]
                            3. Add Preprocessing

                            Alternative 16: 74.0% accurate, 20.8× speedup?

                            \[\begin{array}{l} \\ \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right) \end{array} \]
                            (FPCore (xi yi zi ux uy maxCos)
                             :precision binary32
                             (fma (* 2.0 uy) (* PI yi) xi))
                            float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                            	return fmaf((2.0f * uy), (((float) M_PI) * yi), xi);
                            }
                            
                            function code(xi, yi, zi, ux, uy, maxCos)
                            	return fma(Float32(Float32(2.0) * uy), Float32(Float32(pi) * yi), xi)
                            end
                            
                            \begin{array}{l}
                            
                            \\
                            \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right)
                            \end{array}
                            
                            Derivation
                            1. Initial program 98.9%

                              \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                            2. Add Preprocessing
                            3. Taylor expanded in uy around 0

                              \[\leadsto \color{blue}{2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \left(maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right)} \]
                            4. Step-by-step derivation
                              1. +-commutativeN/A

                                \[\leadsto 2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + \color{blue}{\left(xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)\right)} \]
                              2. associate-+r+N/A

                                \[\leadsto \color{blue}{\left(2 \cdot \left(\left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                              3. associate-*r*N/A

                                \[\leadsto \left(\color{blue}{\left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)\right) \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}} + xi \cdot \sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)}\right) + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                              4. distribute-rgt-outN/A

                                \[\leadsto \color{blue}{\sqrt{1 - {maxCos}^{2} \cdot \left({ux}^{2} \cdot {\left(1 - ux\right)}^{2}\right)} \cdot \left(2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right) + xi\right)} + maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right) \]
                            5. Applied rewrites84.3%

                              \[\leadsto \color{blue}{\mathsf{fma}\left(\sqrt{\mathsf{fma}\left(maxCos \cdot maxCos, \left(\left(1 - ux\right) \cdot \left(1 - ux\right)\right) \cdot \left(ux \cdot \left(-ux\right)\right), 1\right)}, \mathsf{fma}\left(2, uy \cdot \left(yi \cdot \pi\right), xi\right), maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)\right)} \]
                            6. Taylor expanded in maxCos around 0

                              \[\leadsto xi + \color{blue}{2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                            7. Step-by-step derivation
                              1. Applied rewrites77.6%

                                \[\leadsto \mathsf{fma}\left(2 \cdot uy, \color{blue}{yi \cdot \pi}, xi\right) \]
                              2. Final simplification77.6%

                                \[\leadsto \mathsf{fma}\left(2 \cdot uy, \pi \cdot yi, xi\right) \]
                              3. Add Preprocessing

                              Alternative 17: 74.0% accurate, 20.8× speedup?

                              \[\begin{array}{l} \\ \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right) \end{array} \]
                              (FPCore (xi yi zi ux uy maxCos)
                               :precision binary32
                               (fma 2.0 (* uy (* PI yi)) xi))
                              float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                              	return fmaf(2.0f, (uy * (((float) M_PI) * yi)), xi);
                              }
                              
                              function code(xi, yi, zi, ux, uy, maxCos)
                              	return fma(Float32(2.0), Float32(uy * Float32(Float32(pi) * yi)), xi)
                              end
                              
                              \begin{array}{l}
                              
                              \\
                              \mathsf{fma}\left(2, uy \cdot \left(\pi \cdot yi\right), xi\right)
                              \end{array}
                              
                              Derivation
                              1. Initial program 98.9%

                                \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                              2. Add Preprocessing
                              3. Taylor expanded in ux around 0

                                \[\leadsto \color{blue}{xi \cdot \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right) + yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                              4. Step-by-step derivation
                                1. lower-fma.f32N/A

                                  \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right)} \]
                                2. lower-cos.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \color{blue}{\cos \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                                3. associate-*r*N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                                4. lower-*.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}, yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                                5. lower-*.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                                6. lower-PI.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \color{blue}{\mathsf{PI}\left(\right)}\right), yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)\right) \]
                                7. lower-*.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), \color{blue}{yi \cdot \sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                                8. lower-sin.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \color{blue}{\sin \left(2 \cdot \left(uy \cdot \mathsf{PI}\left(\right)\right)\right)}\right) \]
                                9. associate-*r*N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                                10. lower-*.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \color{blue}{\left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right)}\right) \]
                                11. lower-*.f32N/A

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \mathsf{PI}\left(\right)\right), yi \cdot \sin \left(\color{blue}{\left(2 \cdot uy\right)} \cdot \mathsf{PI}\left(\right)\right)\right) \]
                                12. lower-PI.f3291.6

                                  \[\leadsto \mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \color{blue}{\pi}\right)\right) \]
                              5. Applied rewrites91.6%

                                \[\leadsto \color{blue}{\mathsf{fma}\left(xi, \cos \left(\left(2 \cdot uy\right) \cdot \pi\right), yi \cdot \sin \left(\left(2 \cdot uy\right) \cdot \pi\right)\right)} \]
                              6. Taylor expanded in uy around 0

                                \[\leadsto xi + \color{blue}{2 \cdot \left(uy \cdot \left(yi \cdot \mathsf{PI}\left(\right)\right)\right)} \]
                              7. Step-by-step derivation
                                1. Applied rewrites77.6%

                                  \[\leadsto \mathsf{fma}\left(2, \color{blue}{uy \cdot \left(\pi \cdot yi\right)}, xi\right) \]
                                2. Add Preprocessing

                                Alternative 18: 11.8% accurate, 32.1× speedup?

                                \[\begin{array}{l} \\ maxCos \cdot \left(ux \cdot zi\right) \end{array} \]
                                (FPCore (xi yi zi ux uy maxCos) :precision binary32 (* maxCos (* ux zi)))
                                float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                                	return maxCos * (ux * zi);
                                }
                                
                                real(4) function code(xi, yi, zi, ux, uy, maxcos)
                                    real(4), intent (in) :: xi
                                    real(4), intent (in) :: yi
                                    real(4), intent (in) :: zi
                                    real(4), intent (in) :: ux
                                    real(4), intent (in) :: uy
                                    real(4), intent (in) :: maxcos
                                    code = maxcos * (ux * zi)
                                end function
                                
                                function code(xi, yi, zi, ux, uy, maxCos)
                                	return Float32(maxCos * Float32(ux * zi))
                                end
                                
                                function tmp = code(xi, yi, zi, ux, uy, maxCos)
                                	tmp = maxCos * (ux * zi);
                                end
                                
                                \begin{array}{l}
                                
                                \\
                                maxCos \cdot \left(ux \cdot zi\right)
                                \end{array}
                                
                                Derivation
                                1. Initial program 98.9%

                                  \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                                2. Add Preprocessing
                                3. Taylor expanded in zi around inf

                                  \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                4. Step-by-step derivation
                                  1. lower-*.f32N/A

                                    \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                  2. associate-*r*N/A

                                    \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                  3. lower-*.f32N/A

                                    \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                  4. lower-*.f32N/A

                                    \[\leadsto maxCos \cdot \left(\color{blue}{\left(ux \cdot zi\right)} \cdot \left(1 - ux\right)\right) \]
                                  5. lower--.f3213.1

                                    \[\leadsto maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \color{blue}{\left(1 - ux\right)}\right) \]
                                5. Applied rewrites13.1%

                                  \[\leadsto \color{blue}{maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                6. Taylor expanded in ux around 0

                                  \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                7. Step-by-step derivation
                                  1. Applied rewrites11.6%

                                    \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                  2. Add Preprocessing

                                  Alternative 19: 11.8% accurate, 32.1× speedup?

                                  \[\begin{array}{l} \\ ux \cdot \left(maxCos \cdot zi\right) \end{array} \]
                                  (FPCore (xi yi zi ux uy maxCos) :precision binary32 (* ux (* maxCos zi)))
                                  float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                                  	return ux * (maxCos * zi);
                                  }
                                  
                                  real(4) function code(xi, yi, zi, ux, uy, maxcos)
                                      real(4), intent (in) :: xi
                                      real(4), intent (in) :: yi
                                      real(4), intent (in) :: zi
                                      real(4), intent (in) :: ux
                                      real(4), intent (in) :: uy
                                      real(4), intent (in) :: maxcos
                                      code = ux * (maxcos * zi)
                                  end function
                                  
                                  function code(xi, yi, zi, ux, uy, maxCos)
                                  	return Float32(ux * Float32(maxCos * zi))
                                  end
                                  
                                  function tmp = code(xi, yi, zi, ux, uy, maxCos)
                                  	tmp = ux * (maxCos * zi);
                                  end
                                  
                                  \begin{array}{l}
                                  
                                  \\
                                  ux \cdot \left(maxCos \cdot zi\right)
                                  \end{array}
                                  
                                  Derivation
                                  1. Initial program 98.9%

                                    \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                                  2. Add Preprocessing
                                  3. Taylor expanded in zi around inf

                                    \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                  4. Step-by-step derivation
                                    1. lower-*.f32N/A

                                      \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                    2. associate-*r*N/A

                                      \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                    3. lower-*.f32N/A

                                      \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                    4. lower-*.f32N/A

                                      \[\leadsto maxCos \cdot \left(\color{blue}{\left(ux \cdot zi\right)} \cdot \left(1 - ux\right)\right) \]
                                    5. lower--.f3213.1

                                      \[\leadsto maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \color{blue}{\left(1 - ux\right)}\right) \]
                                  5. Applied rewrites13.1%

                                    \[\leadsto \color{blue}{maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                  6. Taylor expanded in ux around 0

                                    \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                  7. Step-by-step derivation
                                    1. Applied rewrites11.6%

                                      \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                    2. Taylor expanded in ux around 0

                                      \[\leadsto maxCos \cdot \color{blue}{\left(ux \cdot zi\right)} \]
                                    3. Step-by-step derivation
                                      1. Applied rewrites11.6%

                                        \[\leadsto \left(maxCos \cdot ux\right) \cdot \color{blue}{zi} \]
                                      2. Step-by-step derivation
                                        1. Applied rewrites11.6%

                                          \[\leadsto \left(zi \cdot maxCos\right) \cdot ux \]
                                        2. Final simplification11.6%

                                          \[\leadsto ux \cdot \left(maxCos \cdot zi\right) \]
                                        3. Add Preprocessing

                                        Alternative 20: 11.8% accurate, 32.1× speedup?

                                        \[\begin{array}{l} \\ zi \cdot \left(ux \cdot maxCos\right) \end{array} \]
                                        (FPCore (xi yi zi ux uy maxCos) :precision binary32 (* zi (* ux maxCos)))
                                        float code(float xi, float yi, float zi, float ux, float uy, float maxCos) {
                                        	return zi * (ux * maxCos);
                                        }
                                        
                                        real(4) function code(xi, yi, zi, ux, uy, maxcos)
                                            real(4), intent (in) :: xi
                                            real(4), intent (in) :: yi
                                            real(4), intent (in) :: zi
                                            real(4), intent (in) :: ux
                                            real(4), intent (in) :: uy
                                            real(4), intent (in) :: maxcos
                                            code = zi * (ux * maxcos)
                                        end function
                                        
                                        function code(xi, yi, zi, ux, uy, maxCos)
                                        	return Float32(zi * Float32(ux * maxCos))
                                        end
                                        
                                        function tmp = code(xi, yi, zi, ux, uy, maxCos)
                                        	tmp = zi * (ux * maxCos);
                                        end
                                        
                                        \begin{array}{l}
                                        
                                        \\
                                        zi \cdot \left(ux \cdot maxCos\right)
                                        \end{array}
                                        
                                        Derivation
                                        1. Initial program 98.9%

                                          \[\left(\left(\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot xi + \left(\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right)}\right) \cdot yi\right) + \left(\left(\left(1 - ux\right) \cdot maxCos\right) \cdot ux\right) \cdot zi \]
                                        2. Add Preprocessing
                                        3. Taylor expanded in zi around inf

                                          \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                        4. Step-by-step derivation
                                          1. lower-*.f32N/A

                                            \[\leadsto \color{blue}{maxCos \cdot \left(ux \cdot \left(zi \cdot \left(1 - ux\right)\right)\right)} \]
                                          2. associate-*r*N/A

                                            \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                          3. lower-*.f32N/A

                                            \[\leadsto maxCos \cdot \color{blue}{\left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                          4. lower-*.f32N/A

                                            \[\leadsto maxCos \cdot \left(\color{blue}{\left(ux \cdot zi\right)} \cdot \left(1 - ux\right)\right) \]
                                          5. lower--.f3213.1

                                            \[\leadsto maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \color{blue}{\left(1 - ux\right)}\right) \]
                                        5. Applied rewrites13.1%

                                          \[\leadsto \color{blue}{maxCos \cdot \left(\left(ux \cdot zi\right) \cdot \left(1 - ux\right)\right)} \]
                                        6. Taylor expanded in ux around 0

                                          \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                        7. Step-by-step derivation
                                          1. Applied rewrites11.6%

                                            \[\leadsto maxCos \cdot \left(ux \cdot \color{blue}{zi}\right) \]
                                          2. Taylor expanded in ux around 0

                                            \[\leadsto maxCos \cdot \color{blue}{\left(ux \cdot zi\right)} \]
                                          3. Step-by-step derivation
                                            1. Applied rewrites11.6%

                                              \[\leadsto \left(maxCos \cdot ux\right) \cdot \color{blue}{zi} \]
                                            2. Final simplification11.6%

                                              \[\leadsto zi \cdot \left(ux \cdot maxCos\right) \]
                                            3. Add Preprocessing

                                            Reproduce

                                            ?
                                            herbie shell --seed 2024233 
                                            (FPCore (xi yi zi ux uy maxCos)
                                              :name "UniformSampleCone 2"
                                              :precision binary32
                                              :pre (and (and (and (and (and (and (<= -10000.0 xi) (<= xi 10000.0)) (and (<= -10000.0 yi) (<= yi 10000.0))) (and (<= -10000.0 zi) (<= zi 10000.0))) (and (<= 2.328306437e-10 ux) (<= ux 1.0))) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
                                              (+ (+ (* (* (cos (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (* (* (- 1.0 ux) maxCos) ux) (* (* (- 1.0 ux) maxCos) ux))))) xi) (* (* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (* (* (- 1.0 ux) maxCos) ux) (* (* (- 1.0 ux) maxCos) ux))))) yi)) (* (* (* (- 1.0 ux) maxCos) ux) zi)))