\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - \left(\left(1 - ux\right) + ux \cdot maxCos\right) \cdot \left(\left(1 - ux\right) + ux \cdot maxCos\right)}
\begin{array}{l}
t_0 := 2 \cdot \mathsf{fma}\left(maxCos, ux \cdot ux, ux\right) - \mathsf{fma}\left(2, maxCos \cdot ux, \left(ux \cdot ux\right) \cdot \mathsf{fma}\left(maxCos, maxCos, 1\right)\right)\\
\sqrt[3]{{\sin \left(\left(uy \cdot 2\right) \cdot \pi\right)}^{3} \cdot \left(t_0 \cdot \sqrt[3]{{t_0}^{1.5}}\right)}
\end{array}
(FPCore (ux uy maxCos) :precision binary32 (* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0
(-
(* 2.0 (fma maxCos (* ux ux) ux))
(fma 2.0 (* maxCos ux) (* (* ux ux) (fma maxCos maxCos 1.0))))))
(cbrt (* (pow (sin (* (* uy 2.0) PI)) 3.0) (* t_0 (cbrt (pow t_0 1.5)))))))float code(float ux, float uy, float maxCos) {
return sinf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((1.0f - (((1.0f - ux) + (ux * maxCos)) * ((1.0f - ux) + (ux * maxCos)))));
}
float code(float ux, float uy, float maxCos) {
float t_0 = (2.0f * fmaf(maxCos, (ux * ux), ux)) - fmaf(2.0f, (maxCos * ux), ((ux * ux) * fmaf(maxCos, maxCos, 1.0f)));
return cbrtf((powf(sinf(((uy * 2.0f) * ((float) M_PI))), 3.0f) * (t_0 * cbrtf(powf(t_0, 1.5f)))));
}



Bits error versus ux



Bits error versus uy



Bits error versus maxCos
Initial program 13.5
Simplified13.5
Taylor expanded in ux around 0 0.5
Simplified0.5
Applied egg-rr0.5
Applied egg-rr0.5
Final simplification0.5
herbie shell --seed 2022125
(FPCore (ux uy maxCos)
:name "UniformSampleCone, y"
:precision binary32
:pre (and (and (and (<= 2.328306437e-10 ux) (<= ux 1.0)) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
(* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))