
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (- (log (- 1.0 u1)))) (cos (* (* 2.0 PI) u2))))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(-logf((1.0f - u1))) * cosf(((2.0f * ((float) M_PI)) * u2));
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(-log(Float32(Float32(1.0) - u1)))) * cos(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt(-log((single(1.0) - u1))) * cos(((single(2.0) * single(pi)) * u2)); end
\begin{array}{l}
\\
\sqrt{-\log \left(1 - u1\right)} \cdot \cos \left(\left(2 \cdot \pi\right) \cdot u2\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 1 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (- (log (- 1.0 u1)))) (cos (* (* 2.0 PI) u2))))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(-logf((1.0f - u1))) * cosf(((2.0f * ((float) M_PI)) * u2));
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(-log(Float32(Float32(1.0) - u1)))) * cos(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt(-log((single(1.0) - u1))) * cos(((single(2.0) * single(pi)) * u2)); end
\begin{array}{l}
\\
\sqrt{-\log \left(1 - u1\right)} \cdot \cos \left(\left(2 \cdot \pi\right) \cdot u2\right)
\end{array}
(FPCore (cosTheta_i u1 u2)
:precision binary32
(let* ((t_0 (- (* (- (* -0.25 u1) 0.3333333333333333) u1) 0.5))
(t_1 (* t_0 u1))
(t_2 (cos (* (* 2.0 PI) u2))))
(if (<= u1 0.04500000178813934)
(*
(pow
(-
(/
(* (- (pow t_1 3.0) 1.0) u1)
(fma t_1 (* (- (* -0.3333333333333333 u1) 0.5) u1) (fma t_0 u1 1.0))))
0.5)
t_2)
(* (sqrt (- (log (- 1.0 u1)))) t_2))))
float code(float cosTheta_i, float u1, float u2) {
float t_0 = (((-0.25f * u1) - 0.3333333333333333f) * u1) - 0.5f;
float t_1 = t_0 * u1;
float t_2 = cosf(((2.0f * ((float) M_PI)) * u2));
float tmp;
if (u1 <= 0.04500000178813934f) {
tmp = powf(-(((powf(t_1, 3.0f) - 1.0f) * u1) / fmaf(t_1, (((-0.3333333333333333f * u1) - 0.5f) * u1), fmaf(t_0, u1, 1.0f))), 0.5f) * t_2;
} else {
tmp = sqrtf(-logf((1.0f - u1))) * t_2;
}
return tmp;
}
function code(cosTheta_i, u1, u2) t_0 = Float32(Float32(Float32(Float32(Float32(-0.25) * u1) - Float32(0.3333333333333333)) * u1) - Float32(0.5)) t_1 = Float32(t_0 * u1) t_2 = cos(Float32(Float32(Float32(2.0) * Float32(pi)) * u2)) tmp = Float32(0.0) if (u1 <= Float32(0.04500000178813934)) tmp = Float32((Float32(-Float32(Float32(Float32((t_1 ^ Float32(3.0)) - Float32(1.0)) * u1) / fma(t_1, Float32(Float32(Float32(Float32(-0.3333333333333333) * u1) - Float32(0.5)) * u1), fma(t_0, u1, Float32(1.0))))) ^ Float32(0.5)) * t_2); else tmp = Float32(sqrt(Float32(-log(Float32(Float32(1.0) - u1)))) * t_2); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(-0.25 \cdot u1 - 0.3333333333333333\right) \cdot u1 - 0.5\\
t_1 := t\_0 \cdot u1\\
t_2 := \cos \left(\left(2 \cdot \pi\right) \cdot u2\right)\\
\mathbf{if}\;u1 \leq 0.04500000178813934:\\
\;\;\;\;{\left(-\frac{\left({t\_1}^{3} - 1\right) \cdot u1}{\mathsf{fma}\left(t\_1, \left(-0.3333333333333333 \cdot u1 - 0.5\right) \cdot u1, \mathsf{fma}\left(t\_0, u1, 1\right)\right)}\right)}^{0.5} \cdot t\_2\\
\mathbf{else}:\\
\;\;\;\;\sqrt{-\log \left(1 - u1\right)} \cdot t\_2\\
\end{array}
\end{array}
if u1 < 0.0450000018Initial program 51.9%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
lower-*.f3298.7
Applied rewrites98.7%
lift--.f32N/A
lift-*.f32N/A
lift--.f32N/A
lift-*.f32N/A
lift--.f32N/A
lift-*.f32N/A
flip3--N/A
lower-/.f32N/A
Applied rewrites98.7%
Taylor expanded in u1 around 0
Applied rewrites98.8%
Applied rewrites98.8%
if 0.0450000018 < u1 Initial program 97.5%
herbie shell --seed 2025059
(FPCore (cosTheta_i u1 u2)
:name "Beckmann Sample, near normal, slope_x"
:precision binary32
:pre (and (and (and (> cosTheta_i 0.9999) (<= cosTheta_i 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 1.0))) (and (<= 2.328306437e-10 u2) (<= u2 1.0)))
(* (sqrt (- (log (- 1.0 u1)))) (cos (* (* 2.0 PI) u2))))