
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* t_0 t_0))))))
float code(float ux, float uy, float maxCos) {
float t_0 = (1.0f - ux) + (ux * maxCos);
return sinf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((1.0f - (t_0 * t_0)));
}
function code(ux, uy, maxCos) t_0 = Float32(Float32(Float32(1.0) - ux) + Float32(ux * maxCos)) return Float32(sin(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))) end
function tmp = code(ux, uy, maxCos) t_0 = (single(1.0) - ux) + (ux * maxCos); tmp = sin(((uy * single(2.0)) * single(pi))) * sqrt((single(1.0) - (t_0 * t_0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 11 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* t_0 t_0))))))
float code(float ux, float uy, float maxCos) {
float t_0 = (1.0f - ux) + (ux * maxCos);
return sinf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((1.0f - (t_0 * t_0)));
}
function code(ux, uy, maxCos) t_0 = Float32(Float32(Float32(1.0) - ux) + Float32(ux * maxCos)) return Float32(sin(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))) end
function tmp = code(ux, uy, maxCos) t_0 = (single(1.0) - ux) + (ux * maxCos); tmp = sin(((uy * single(2.0)) * single(pi))) * sqrt((single(1.0) - (t_0 * t_0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\sin \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
(FPCore (ux uy maxCos)
:precision binary32
(cbrt
(*
(pow
(* ux (+ 2.0 (fma (- ux) (pow (+ -1.0 maxCos) 2.0) (* maxCos -2.0))))
1.5)
(pow (sin (* 2.0 (* uy PI))) 3.0))))
float code(float ux, float uy, float maxCos) {
return cbrtf((powf((ux * (2.0f + fmaf(-ux, powf((-1.0f + maxCos), 2.0f), (maxCos * -2.0f)))), 1.5f) * powf(sinf((2.0f * (uy * ((float) M_PI)))), 3.0f)));
}
function code(ux, uy, maxCos) return cbrt(Float32((Float32(ux * Float32(Float32(2.0) + fma(Float32(-ux), (Float32(Float32(-1.0) + maxCos) ^ Float32(2.0)), Float32(maxCos * Float32(-2.0))))) ^ Float32(1.5)) * (sin(Float32(Float32(2.0) * Float32(uy * Float32(pi)))) ^ Float32(3.0)))) end
\begin{array}{l}
\\
\sqrt[3]{{\left(ux \cdot \left(2 + \mathsf{fma}\left(-ux, {\left(-1 + maxCos\right)}^{2}, maxCos \cdot -2\right)\right)\right)}^{1.5} \cdot {\sin \left(2 \cdot \left(uy \cdot \pi\right)\right)}^{3}}
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
*-commutative98.5%
add-cbrt-cube98.4%
add-cbrt-cube98.4%
cbrt-unprod98.3%
Applied egg-rr98.7%
Final simplification98.7%
(FPCore (ux uy maxCos) :precision binary32 (cbrt (* (pow (sin (* 2.0 (* uy PI))) 3.0) (pow (* ux (- 2.0 (+ ux (* maxCos (+ 2.0 (* ux (+ maxCos -2.0))))))) 1.5))))
float code(float ux, float uy, float maxCos) {
return cbrtf((powf(sinf((2.0f * (uy * ((float) M_PI)))), 3.0f) * powf((ux * (2.0f - (ux + (maxCos * (2.0f + (ux * (maxCos + -2.0f))))))), 1.5f)));
}
function code(ux, uy, maxCos) return cbrt(Float32((sin(Float32(Float32(2.0) * Float32(uy * Float32(pi)))) ^ Float32(3.0)) * (Float32(ux * Float32(Float32(2.0) - Float32(ux + Float32(maxCos * Float32(Float32(2.0) + Float32(ux * Float32(maxCos + Float32(-2.0)))))))) ^ Float32(1.5)))) end
\begin{array}{l}
\\
\sqrt[3]{{\sin \left(2 \cdot \left(uy \cdot \pi\right)\right)}^{3} \cdot {\left(ux \cdot \left(2 - \left(ux + maxCos \cdot \left(2 + ux \cdot \left(maxCos + -2\right)\right)\right)\right)\right)}^{1.5}}
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
*-commutative98.5%
add-cbrt-cube98.4%
add-cbrt-cube98.4%
cbrt-unprod98.3%
Applied egg-rr98.7%
Taylor expanded in maxCos around 0 98.7%
Taylor expanded in ux around -inf 98.7%
associate-*r*98.7%
neg-mul-198.7%
sub-neg98.7%
metadata-eval98.7%
Simplified98.7%
Final simplification98.7%
(FPCore (ux uy maxCos) :precision binary32 (* (sin (* PI (* 2.0 uy))) (sqrt (* ux (+ 2.0 (- (* maxCos (- (- (* ux 2.0) (* ux maxCos)) 2.0)) ux))))))
float code(float ux, float uy, float maxCos) {
return sinf((((float) M_PI) * (2.0f * uy))) * sqrtf((ux * (2.0f + ((maxCos * (((ux * 2.0f) - (ux * maxCos)) - 2.0f)) - ux))));
}
function code(ux, uy, maxCos) return Float32(sin(Float32(Float32(pi) * Float32(Float32(2.0) * uy))) * sqrt(Float32(ux * Float32(Float32(2.0) + Float32(Float32(maxCos * Float32(Float32(Float32(ux * Float32(2.0)) - Float32(ux * maxCos)) - Float32(2.0))) - ux))))) end
function tmp = code(ux, uy, maxCos) tmp = sin((single(pi) * (single(2.0) * uy))) * sqrt((ux * (single(2.0) + ((maxCos * (((ux * single(2.0)) - (ux * maxCos)) - single(2.0))) - ux)))); end
\begin{array}{l}
\\
\sin \left(\pi \cdot \left(2 \cdot uy\right)\right) \cdot \sqrt{ux \cdot \left(2 + \left(maxCos \cdot \left(\left(ux \cdot 2 - ux \cdot maxCos\right) - 2\right) - ux\right)\right)}
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
Taylor expanded in maxCos around 0 98.5%
Final simplification98.5%
(FPCore (ux uy maxCos) :precision binary32 (* (sin (* PI (* 2.0 uy))) (sqrt (* ux (+ 2.0 (- (* maxCos (- (* ux 2.0) 2.0)) ux))))))
float code(float ux, float uy, float maxCos) {
return sinf((((float) M_PI) * (2.0f * uy))) * sqrtf((ux * (2.0f + ((maxCos * ((ux * 2.0f) - 2.0f)) - ux))));
}
function code(ux, uy, maxCos) return Float32(sin(Float32(Float32(pi) * Float32(Float32(2.0) * uy))) * sqrt(Float32(ux * Float32(Float32(2.0) + Float32(Float32(maxCos * Float32(Float32(ux * Float32(2.0)) - Float32(2.0))) - ux))))) end
function tmp = code(ux, uy, maxCos) tmp = sin((single(pi) * (single(2.0) * uy))) * sqrt((ux * (single(2.0) + ((maxCos * ((ux * single(2.0)) - single(2.0))) - ux)))); end
\begin{array}{l}
\\
\sin \left(\pi \cdot \left(2 \cdot uy\right)\right) \cdot \sqrt{ux \cdot \left(2 + \left(maxCos \cdot \left(ux \cdot 2 - 2\right) - ux\right)\right)}
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
Taylor expanded in maxCos around 0 97.5%
Final simplification97.5%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0 (* PI (* 2.0 uy))))
(if (<= (* 2.0 uy) 0.00039999998989515007)
(*
(sqrt
(* ux (+ 2.0 (- (* maxCos (- (- (* ux 2.0) (* ux maxCos)) 2.0)) ux))))
t_0)
(* (sin t_0) (sqrt (* ux (- 2.0 ux)))))))
float code(float ux, float uy, float maxCos) {
float t_0 = ((float) M_PI) * (2.0f * uy);
float tmp;
if ((2.0f * uy) <= 0.00039999998989515007f) {
tmp = sqrtf((ux * (2.0f + ((maxCos * (((ux * 2.0f) - (ux * maxCos)) - 2.0f)) - ux)))) * t_0;
} else {
tmp = sinf(t_0) * sqrtf((ux * (2.0f - ux)));
}
return tmp;
}
function code(ux, uy, maxCos) t_0 = Float32(Float32(pi) * Float32(Float32(2.0) * uy)) tmp = Float32(0.0) if (Float32(Float32(2.0) * uy) <= Float32(0.00039999998989515007)) tmp = Float32(sqrt(Float32(ux * Float32(Float32(2.0) + Float32(Float32(maxCos * Float32(Float32(Float32(ux * Float32(2.0)) - Float32(ux * maxCos)) - Float32(2.0))) - ux)))) * t_0); else tmp = Float32(sin(t_0) * sqrt(Float32(ux * Float32(Float32(2.0) - ux)))); end return tmp end
function tmp_2 = code(ux, uy, maxCos) t_0 = single(pi) * (single(2.0) * uy); tmp = single(0.0); if ((single(2.0) * uy) <= single(0.00039999998989515007)) tmp = sqrt((ux * (single(2.0) + ((maxCos * (((ux * single(2.0)) - (ux * maxCos)) - single(2.0))) - ux)))) * t_0; else tmp = sin(t_0) * sqrt((ux * (single(2.0) - ux))); end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \pi \cdot \left(2 \cdot uy\right)\\
\mathbf{if}\;2 \cdot uy \leq 0.00039999998989515007:\\
\;\;\;\;\sqrt{ux \cdot \left(2 + \left(maxCos \cdot \left(\left(ux \cdot 2 - ux \cdot maxCos\right) - 2\right) - ux\right)\right)} \cdot t\_0\\
\mathbf{else}:\\
\;\;\;\;\sin t\_0 \cdot \sqrt{ux \cdot \left(2 - ux\right)}\\
\end{array}
\end{array}
if (*.f32 uy #s(literal 2 binary32)) < 3.9999999e-4Initial program 58.7%
Taylor expanded in ux around 0 98.5%
associate--l+98.6%
associate-*r*98.6%
mul-1-neg98.6%
sub-neg98.6%
metadata-eval98.6%
+-commutative98.6%
Simplified98.6%
Taylor expanded in uy around 0 98.4%
associate-*r*98.4%
Simplified98.4%
Taylor expanded in maxCos around 0 98.4%
if 3.9999999e-4 < (*.f32 uy #s(literal 2 binary32)) Initial program 60.8%
Taylor expanded in ux around 0 98.3%
associate--l+98.3%
associate-*r*98.3%
mul-1-neg98.3%
sub-neg98.3%
metadata-eval98.3%
+-commutative98.3%
Simplified98.3%
add-cbrt-cube98.2%
pow1/395.8%
Applied egg-rr95.9%
unpow1/398.1%
fma-define98.1%
*-commutative98.1%
fma-undefine98.1%
+-commutative98.1%
*-commutative98.1%
Simplified98.1%
Taylor expanded in maxCos around 0 93.1%
mul-1-neg93.1%
unsub-neg93.1%
Simplified93.1%
Final simplification96.6%
(FPCore (ux uy maxCos) :precision binary32 (* (sqrt (* ux (+ 2.0 (- (* maxCos (- (- (* ux 2.0) (* ux maxCos)) 2.0)) ux)))) (* PI (* 2.0 uy))))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * (2.0f + ((maxCos * (((ux * 2.0f) - (ux * maxCos)) - 2.0f)) - ux)))) * (((float) M_PI) * (2.0f * uy));
}
function code(ux, uy, maxCos) return Float32(sqrt(Float32(ux * Float32(Float32(2.0) + Float32(Float32(maxCos * Float32(Float32(Float32(ux * Float32(2.0)) - Float32(ux * maxCos)) - Float32(2.0))) - ux)))) * Float32(Float32(pi) * Float32(Float32(2.0) * uy))) end
function tmp = code(ux, uy, maxCos) tmp = sqrt((ux * (single(2.0) + ((maxCos * (((ux * single(2.0)) - (ux * maxCos)) - single(2.0))) - ux)))) * (single(pi) * (single(2.0) * uy)); end
\begin{array}{l}
\\
\sqrt{ux \cdot \left(2 + \left(maxCos \cdot \left(\left(ux \cdot 2 - ux \cdot maxCos\right) - 2\right) - ux\right)\right)} \cdot \left(\pi \cdot \left(2 \cdot uy\right)\right)
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
Taylor expanded in uy around 0 83.3%
associate-*r*83.3%
Simplified83.3%
Taylor expanded in maxCos around 0 83.3%
Final simplification83.3%
(FPCore (ux uy maxCos) :precision binary32 (* (sqrt (* ux (+ 2.0 (- (* maxCos (- (* ux 2.0) 2.0)) ux)))) (* PI (* 2.0 uy))))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * (2.0f + ((maxCos * ((ux * 2.0f) - 2.0f)) - ux)))) * (((float) M_PI) * (2.0f * uy));
}
function code(ux, uy, maxCos) return Float32(sqrt(Float32(ux * Float32(Float32(2.0) + Float32(Float32(maxCos * Float32(Float32(ux * Float32(2.0)) - Float32(2.0))) - ux)))) * Float32(Float32(pi) * Float32(Float32(2.0) * uy))) end
function tmp = code(ux, uy, maxCos) tmp = sqrt((ux * (single(2.0) + ((maxCos * ((ux * single(2.0)) - single(2.0))) - ux)))) * (single(pi) * (single(2.0) * uy)); end
\begin{array}{l}
\\
\sqrt{ux \cdot \left(2 + \left(maxCos \cdot \left(ux \cdot 2 - 2\right) - ux\right)\right)} \cdot \left(\pi \cdot \left(2 \cdot uy\right)\right)
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
Taylor expanded in uy around 0 83.3%
associate-*r*83.3%
Simplified83.3%
Taylor expanded in maxCos around 0 82.6%
Final simplification82.6%
(FPCore (ux uy maxCos) :precision binary32 (* 2.0 (* (* uy PI) (sqrt (* ux (- 2.0 ux))))))
float code(float ux, float uy, float maxCos) {
return 2.0f * ((uy * ((float) M_PI)) * sqrtf((ux * (2.0f - ux))));
}
function code(ux, uy, maxCos) return Float32(Float32(2.0) * Float32(Float32(uy * Float32(pi)) * sqrt(Float32(ux * Float32(Float32(2.0) - ux))))) end
function tmp = code(ux, uy, maxCos) tmp = single(2.0) * ((uy * single(pi)) * sqrt((ux * (single(2.0) - ux)))); end
\begin{array}{l}
\\
2 \cdot \left(\left(uy \cdot \pi\right) \cdot \sqrt{ux \cdot \left(2 - ux\right)}\right)
\end{array}
Initial program 59.4%
Taylor expanded in ux around 0 98.5%
associate--l+98.5%
associate-*r*98.5%
mul-1-neg98.5%
sub-neg98.5%
metadata-eval98.5%
+-commutative98.5%
Simplified98.5%
Taylor expanded in uy around 0 83.3%
associate-*r*83.3%
Simplified83.3%
Taylor expanded in maxCos around 0 78.3%
*-commutative78.3%
mul-1-neg78.3%
unsub-neg78.3%
Simplified78.3%
(FPCore (ux uy maxCos) :precision binary32 (* (+ 1.0 (+ (* maxCos -2.0) 1.0)) (* ux (* uy PI))))
float code(float ux, float uy, float maxCos) {
return (1.0f + ((maxCos * -2.0f) + 1.0f)) * (ux * (uy * ((float) M_PI)));
}
function code(ux, uy, maxCos) return Float32(Float32(Float32(1.0) + Float32(Float32(maxCos * Float32(-2.0)) + Float32(1.0))) * Float32(ux * Float32(uy * Float32(pi)))) end
function tmp = code(ux, uy, maxCos) tmp = (single(1.0) + ((maxCos * single(-2.0)) + single(1.0))) * (ux * (uy * single(pi))); end
\begin{array}{l}
\\
\left(1 + \left(maxCos \cdot -2 + 1\right)\right) \cdot \left(ux \cdot \left(uy \cdot \pi\right)\right)
\end{array}
Initial program 59.4%
associate-*l*59.4%
sub-neg59.4%
+-commutative59.4%
distribute-rgt-neg-in59.4%
fma-define59.3%
Simplified59.4%
Taylor expanded in uy around 0 52.3%
Simplified52.5%
Taylor expanded in maxCos around -inf -0.0%
associate-*r*-0.0%
*-commutative-0.0%
associate-*r*-0.0%
Simplified-0.0%
Applied egg-rr6.2%
rem-cube-cbrt6.2%
Simplified6.2%
Applied egg-rr19.1%
sub-neg19.1%
log1p-undefine19.1%
rem-exp-log19.1%
*-commutative19.1%
metadata-eval19.1%
Simplified19.1%
Final simplification19.1%
(FPCore (ux uy maxCos) :precision binary32 (* (* maxCos -2.0) (* PI (* ux (- uy)))))
float code(float ux, float uy, float maxCos) {
return (maxCos * -2.0f) * (((float) M_PI) * (ux * -uy));
}
function code(ux, uy, maxCos) return Float32(Float32(maxCos * Float32(-2.0)) * Float32(Float32(pi) * Float32(ux * Float32(-uy)))) end
function tmp = code(ux, uy, maxCos) tmp = (maxCos * single(-2.0)) * (single(pi) * (ux * -uy)); end
\begin{array}{l}
\\
\left(maxCos \cdot -2\right) \cdot \left(\pi \cdot \left(ux \cdot \left(-uy\right)\right)\right)
\end{array}
Initial program 59.4%
associate-*l*59.4%
sub-neg59.4%
+-commutative59.4%
distribute-rgt-neg-in59.4%
fma-define59.3%
Simplified59.4%
Taylor expanded in uy around 0 52.3%
Simplified52.5%
Taylor expanded in maxCos around -inf -0.0%
associate-*r*-0.0%
*-commutative-0.0%
associate-*r*-0.0%
Simplified-0.0%
Applied egg-rr9.7%
Final simplification9.7%
(FPCore (ux uy maxCos) :precision binary32 (* -2.0 (* maxCos (* ux (* uy PI)))))
float code(float ux, float uy, float maxCos) {
return -2.0f * (maxCos * (ux * (uy * ((float) M_PI))));
}
function code(ux, uy, maxCos) return Float32(Float32(-2.0) * Float32(maxCos * Float32(ux * Float32(uy * Float32(pi))))) end
function tmp = code(ux, uy, maxCos) tmp = single(-2.0) * (maxCos * (ux * (uy * single(pi)))); end
\begin{array}{l}
\\
-2 \cdot \left(maxCos \cdot \left(ux \cdot \left(uy \cdot \pi\right)\right)\right)
\end{array}
Initial program 59.4%
associate-*l*59.4%
sub-neg59.4%
+-commutative59.4%
distribute-rgt-neg-in59.4%
fma-define59.3%
Simplified59.4%
Taylor expanded in uy around 0 52.3%
Simplified52.5%
Taylor expanded in maxCos around -inf -0.0%
associate-*r*-0.0%
*-commutative-0.0%
associate-*r*-0.0%
Simplified-0.0%
Applied egg-rr6.2%
rem-cube-cbrt6.2%
Simplified6.2%
Taylor expanded in maxCos around 0 6.2%
herbie shell --seed 2024137
(FPCore (ux uy maxCos)
:name "UniformSampleCone, y"
:precision binary32
:pre (and (and (and (<= 2.328306437e-10 ux) (<= ux 1.0)) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
(* (sin (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))