
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* t_0 t_0))))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* t_0 t_0))))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0 (+ (- 1.0 ux) (* ux maxCos))) (t_1 (* (* uy 2.0) (PI))))
(if (<= t_0 0.9999999403953552)
(* (cos t_1) (sqrt (- 1.0 (* t_0 t_0))))
t_1)))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
t_1 := \left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\\
\mathbf{if}\;t\_0 \leq 0.9999999403953552:\\
\;\;\;\;\cos t\_1 \cdot \sqrt{1 - t\_0 \cdot t\_0}\\
\mathbf{else}:\\
\;\;\;\;t\_1\\
\end{array}
\end{array}
if (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos)) < 0.99999994 Initial program 69.1%
if 0.99999994 < (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos)) Initial program 6.8%
Taylor expanded in ux around 0
Applied rewrites 21.7%
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (* (* uy 2.0) (PI)))) (* (cos t_0) (sqrt t_0))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\\
\cos t\_0 \cdot \sqrt{t\_0}
\end{array}
\end{array}
Initial program 54.0%
Taylor expanded in ux around 0
Applied rewrites 20.1%
Taylor expanded in ux around 0
Applied rewrites 22.2%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) (PI))) (sqrt (* uy 2.0))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{uy \cdot 2}
\end{array}
Initial program 54.0%
Taylor expanded in ux around 0
Applied rewrites 20.1%
Taylor expanded in ux around 0
Applied rewrites 22.2%
(FPCore (ux uy maxCos) :precision binary32 (cos (* (* uy 2.0) (PI))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right)
\end{array}
Initial program 54.0%
Taylor expanded in ux around 0
Applied rewrites 20.4%
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* t_0 t_0)))
/*
 * Herbie alternative: returns the square of the blend term
 * (1 - ux) + ux * maxCos, computed in single precision.
 *
 * uy is part of the shared benchmark signature but is not read here.
 */
float code(float ux, float uy, float maxCos) {
	(void)uy; /* unused by this alternative */
	const float blend = (1.0f - ux) + (ux * maxCos);
	return blend * blend;
}
! Herbie alternative: returns the square of the blend term
! (1 - ux) + ux * maxcos, computed in real(4).
! uy belongs to the shared benchmark signature but is not read here.
function code(ux, uy, maxcos) result(squared)
    real(4), intent (in) :: ux, uy, maxcos
    real(4) :: squared
    real(4) :: blend
    blend = (1.0e0 - ux) + (ux * maxcos)
    squared = blend * blend
end function code
# Herbie alternative: returns the square of the blend term
# (1 - ux) + ux * maxCos, with every intermediate rounded to Float32.
# uy belongs to the shared benchmark signature but is not read here.
function code(ux, uy, maxCos)
    # Each statement sits on its own line: Julia needs a newline or `;`
    # between the assignment and the `return`.
    t_0 = Float32(Float32(Float32(1.0) - ux) + Float32(ux * maxCos))
    return Float32(t_0 * t_0)
end
function tmp = code(ux, uy, maxCos)
	% Herbie alternative: returns the square of the blend term
	% (1 - ux) + ux * maxCos. The literal 1 is a single.
	% uy belongs to the shared benchmark signature but is not read here.
	blend = (single(1.0) - ux) + (ux * maxCos);
	tmp = blend * blend;
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
t\_0 \cdot t\_0
\end{array}
\end{array}
Initial program 54.0%
Taylor expanded in ux around 0
Applied rewrites 20.4%
Taylor expanded in ux around inf
Applied rewrites 19.4%
(FPCore (ux uy maxCos) :precision binary32 (- 1.0 ux))
/*
 * Herbie alternative: returns 1 - ux in single precision.
 *
 * uy and maxCos are part of the shared benchmark signature but are not
 * read here.
 */
float code(float ux, float uy, float maxCos) {
	const float complement = 1.0f - ux;
	(void)uy;     /* unused by this alternative */
	(void)maxCos; /* unused by this alternative */
	return complement;
}
! Herbie alternative: returns 1 - ux in real(4).
! uy and maxcos belong to the shared benchmark signature but are not
! read here.
function code(ux, uy, maxcos) result(complement)
    real(4), intent (in) :: ux, uy, maxcos
    real(4) :: complement
    complement = 1.0e0 - ux
end function code
# Herbie alternative: returns 1 - ux, rounded to Float32.
# uy and maxCos belong to the shared benchmark signature but are not read here.
function code(ux, uy, maxCos)
    one32 = Float32(1.0)
    complement = one32 - ux
    return Float32(complement)
end
function tmp = code(ux, uy, maxCos)
	% Herbie alternative: returns 1 - ux, with the literal 1 as a single.
	% uy and maxCos belong to the shared benchmark signature but are not
	% read here.
	one32 = single(1.0);
	tmp = one32 - ux;
end
\begin{array}{l}
\\
1 - ux
\end{array}
Initial program 54.0%
Taylor expanded in ux around 0
Applied rewrites 20.4%
Taylor expanded in ux around inf
Applied rewrites 19.4%
Taylor expanded in ux around 0
Applied rewrites 19.3%
herbie shell --seed 2024321
; Benchmark definition over the three inputs ux, uy and maxCos.
(FPCore (ux uy maxCos)
:name "UniformSampleCone, x"
; Declares binary32 (single precision) as the precision of the expression.
:precision binary32
; Precondition: ux and uy lie in [2.328306437e-10, 1]; maxCos lies in [0, 1].
; NOTE(review): 2.328306437e-10 is approximately 2^-32; presumably the
; smallest value produced by a 32-bit uniform generator -- confirm.
:pre (and (and (and (<= 2.328306437e-10 ux) (<= ux 1.0)) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
; Body: cos(2*PI*uy) * sqrt(1 - t*t), where t = (1 - ux) + ux*maxCos is
; written out twice rather than bound with let.
(* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))