
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* t_0 t_0))))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* t_0 t_0))))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) (PI))) (sqrt (* (- (* (- 1.0 maxCos) 2.0) (* (pow (- 1.0 maxCos) 2.0) ux)) ux))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(\left(1 - maxCos\right) \cdot 2 - {\left(1 - maxCos\right)}^{2} \cdot ux\right) \cdot ux}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in maxCos around inf
*-commutativeN/A
lower-*.f32N/A
associate--r+N/A
lower--.f32N/A
lower--.f32N/A
lower-/.f32N/A
lower-/.f3258.0
Applied rewrites58.0%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
fp-cancel-sub-signN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-pow.f32N/A
lower--.f3299.0
Applied rewrites99.0%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))
(t_1 (cos (* (* uy 2.0) (PI))))
(t_2 (sqrt (- 1.0 (* t_0 t_0)))))
(if (<= (* t_1 t_2) 0.025499999523162842)
(* t_1 (sqrt (* 2.0 ux)))
(* (+ 1.0 (* (* (* (* uy uy) -2.0) (PI)) (PI))) t_2))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
t_1 := \cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right)\\
t_2 := \sqrt{1 - t\_0 \cdot t\_0}\\
\mathbf{if}\;t\_1 \cdot t\_2 \leq 0.025499999523162842:\\
\;\;\;\;t\_1 \cdot \sqrt{2 \cdot ux}\\
\mathbf{else}:\\
\;\;\;\;\left(1 + \left(\left(\left(uy \cdot uy\right) \cdot -2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \mathsf{PI}\left(\right)\right) \cdot t\_2\\
\end{array}
\end{array}
if (*.f32 (cos.f32 (*.f32 (*.f32 uy #s(literal 2 binary32)) (PI.f32))) (sqrt.f32 (-.f32 #s(literal 1 binary32) (*.f32 (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos)) (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos)))))) < 0.0255
Initial program 39.9%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
lower-fma.f3265.4
Applied rewrites65.3%
Taylor expanded in maxCos around 0
Applied rewrites87.2%
if 0.0255 < (*.f32 (cos.f32 (*.f32 (*.f32 uy #s(literal 2 binary32)) (PI.f32))) (sqrt.f32 (-.f32 #s(literal 1 binary32) (*.f32 (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos)) (+.f32 (-.f32 #s(literal 1 binary32) ux) (*.f32 ux maxCos))))))
Initial program 89.3%
Taylor expanded in uy around 0
+-commutativeN/A
associate-*r*N/A
lower-fma.f32N/A
*-commutativeN/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-PI.f3280.3
Applied rewrites80.3%
Applied rewrites85.8%
Final simplification86.7%
(FPCore (ux uy maxCos)
:precision binary32
(*
(cos (* (* uy 2.0) (PI)))
(sqrt
(*
(+ (* 2.0 (/ (- 1.0 maxCos) ux)) (* (+ -1.0 maxCos) (- 1.0 maxCos)))
(* ux ux)))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(2 \cdot \frac{1 - maxCos}{ux} + \left(-1 + maxCos\right) \cdot \left(1 - maxCos\right)\right) \cdot \left(ux \cdot ux\right)}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in ux around inf
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
unpow2N/A
lower-*.f3298.8
Applied rewrites98.8%
Applied rewrites98.8%
Final simplification98.8%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) (PI))) (sqrt (- (* (- 2.0 ux) ux) (* (* (fma -2.0 ux 2.0) ux) maxCos)))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(2 - ux\right) \cdot ux - \left(\mathsf{fma}\left(-2, ux, 2\right) \cdot ux\right) \cdot maxCos}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in maxCos around inf
*-commutativeN/A
lower-*.f32N/A
associate--r+N/A
lower--.f32N/A
lower--.f32N/A
lower-/.f32N/A
lower-/.f3258.0
Applied rewrites58.0%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
fp-cancel-sub-signN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-pow.f32N/A
lower--.f3299.0
Applied rewrites99.0%
Taylor expanded in maxCos around 0
Applied rewrites92.2%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) (PI))) (sqrt (* (- (- 2.0 (* (fma -2.0 ux 2.0) maxCos)) ux) ux))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(\left(2 - \mathsf{fma}\left(-2, ux, 2\right) \cdot maxCos\right) - ux\right) \cdot ux}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in maxCos around inf
*-commutativeN/A
lower-*.f32N/A
associate--r+N/A
lower--.f32N/A
lower--.f32N/A
lower-/.f32N/A
lower-/.f3258.0
Applied rewrites58.0%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
fp-cancel-sub-signN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-pow.f32N/A
lower--.f3299.0
Applied rewrites99.0%
Taylor expanded in maxCos around 0
Applied rewrites91.8%
(FPCore (ux uy maxCos) :precision binary32 (if (<= uy 0.00011700000322889537) (sqrt (* (- (* (- 1.0 maxCos) 2.0) (* (pow (- 1.0 maxCos) 2.0) ux)) ux)) (* (cos (* (* uy 2.0) (PI))) (sqrt (* (- 2.0 ux) ux)))))
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;uy \leq 0.00011700000322889537:\\
\;\;\;\;\sqrt{\left(\left(1 - maxCos\right) \cdot 2 - {\left(1 - maxCos\right)}^{2} \cdot ux\right) \cdot ux}\\
\mathbf{else}:\\
\;\;\;\;\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(2 - ux\right) \cdot ux}\\
\end{array}
\end{array}
if uy < 1.17000003e-4
Initial program 58.8%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites59.0%
Taylor expanded in ux around inf
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
unpow2N/A
lower-*.f3299.4
Applied rewrites99.4%
Taylor expanded in uy around 0
lower-sqrt.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f3255.8
Applied rewrites54.9%
Taylor expanded in ux around 0
Applied rewrites99.4%
if 1.17000003e-4 < uy
Initial program 55.8%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites55.8%
Taylor expanded in maxCos around inf
*-commutativeN/A
lower-*.f32N/A
associate--r+N/A
lower--.f32N/A
lower--.f32N/A
lower-/.f32N/A
lower-/.f3254.7
Applied rewrites54.7%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
fp-cancel-sub-signN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-pow.f32N/A
lower--.f3298.0
Applied rewrites98.0%
Taylor expanded in maxCos around 0
Applied rewrites92.9%
Final simplification96.9%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) (PI))) (sqrt (* (- 2.0 ux) ux))))
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{\left(2 - ux\right) \cdot ux}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in maxCos around inf
*-commutativeN/A
lower-*.f32N/A
associate--r+N/A
lower--.f32N/A
lower--.f32N/A
lower-/.f32N/A
lower-/.f3258.0
Applied rewrites58.0%
Taylor expanded in ux around 0
metadata-evalN/A
fp-cancel-sign-sub-invN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
fp-cancel-sub-signN/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-pow.f32N/A
lower--.f3299.0
Applied rewrites99.0%
Taylor expanded in maxCos around 0
Applied rewrites92.7%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0 (+ (- 1.0 ux) (* ux maxCos))))
(if (<= ux 7.100000220816582e-5)
(sqrt (* (* (- 1.0 maxCos) ux) 2.0))
(*
(+ 1.0 (* (* (* (* uy uy) -2.0) (PI)) (PI)))
(sqrt (- 1.0 (* t_0 t_0)))))))
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\mathbf{if}\;ux \leq 7.100000220816582 \cdot 10^{-5}:\\
\;\;\;\;\sqrt{\left(\left(1 - maxCos\right) \cdot ux\right) \cdot 2}\\
\mathbf{else}:\\
\;\;\;\;\left(1 + \left(\left(\left(uy \cdot uy\right) \cdot -2\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \mathsf{PI}\left(\right)\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}\\
\end{array}
\end{array}
if ux < 7.10000022e-5
Initial program 36.2%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites36.2%
Taylor expanded in ux around inf
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
unpow2N/A
lower-*.f3298.6
Applied rewrites98.6%
Taylor expanded in uy around 0
lower-sqrt.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f3232.7
Applied rewrites31.1%
Taylor expanded in ux around 0
Applied rewrites76.5%
if 7.10000022e-5 < ux
Initial program 87.1%
Taylor expanded in uy around 0
+-commutativeN/A
associate-*r*N/A
lower-fma.f32N/A
*-commutativeN/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-PI.f32N/A
lower-PI.f3275.7
Applied rewrites75.3%
Applied rewrites81.5%
Final simplification78.6%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (* (* (- 1.0 maxCos) ux) 2.0)))
float code(float ux, float uy, float maxCos) {
return sqrtf((((1.0f - maxCos) * ux) * 2.0f));
}
! Single-precision evaluation of sqrt(((1 - maxcos) * ux) * 2).
! uy is part of the argument list but does not enter the computation.
function code(ux, uy, maxcos) result(res)
    real(4), intent (in) :: ux
    real(4), intent (in) :: uy
    real(4), intent (in) :: maxcos
    real(4) :: res
    real(4) :: scaled
    scaled = (1.0e0 - maxcos) * ux
    res = sqrt(scaled * 2.0e0)
end function code
# Float32 evaluation of sqrt(((1 - maxCos) * ux) * 2); every intermediate is
# rounded to Float32. uy is accepted but does not enter the computation.
function code(ux, uy, maxCos)
    one_minus_max_cos = Float32(Float32(1.0) - maxCos)
    scaled = Float32(one_minus_max_cos * ux)
    doubled = Float32(scaled * Float32(2.0))
    return sqrt(doubled)
end
function tmp = code(ux, uy, maxCos)
    % Evaluates sqrt(((1 - maxCos) * ux) * 2) using single-precision constants.
    % uy is accepted but does not enter the computation.
    one_minus_max_cos = single(1.0) - maxCos;
    scaled = one_minus_max_cos * ux;
    tmp = sqrt(scaled * single(2.0));
end
\begin{array}{l}
\\
\sqrt{\left(\left(1 - maxCos\right) \cdot ux\right) \cdot 2}
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in ux around inf
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
unpow2N/A
lower-*.f3298.8
Applied rewrites98.8%
Taylor expanded in uy around 0
lower-sqrt.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f3248.6
Applied rewrites43.4%
Taylor expanded in ux around 0
Applied rewrites65.5%
Final simplification65.5%
(FPCore (ux uy maxCos) :precision binary32 (* (* (sqrt -1.0) ux) maxCos))
float code(float ux, float uy, float maxCos) {
return (sqrtf(-1.0f) * ux) * maxCos;
}
! Evaluates (sqrt(-1) * ux) * maxcos in single precision.
! uy is part of the argument list but does not enter the computation.
!
! The negative operand is held in a variable rather than written as a literal:
! sqrt applied to a negative constant is a constant expression that compilers
! such as gfortran reject at compile time. Evaluated at run time on an
! IEEE-754 target the square root yields NaN, which propagates to the result.
real(4) function code(ux, uy, maxcos)
    real(4), intent (in) :: ux
    real(4), intent (in) :: uy
    real(4), intent (in) :: maxcos
    real(4) :: minus_one
    minus_one = -1.0e0
    code = (sqrt(minus_one) * ux) * maxcos
end function
# Float32 evaluation of (sqrt(-1) * ux) * maxCos, where the real square root of
# -1 is represented as NaN. Julia's sqrt throws DomainError for a negative real
# argument instead of returning NaN, so the NaN32 constant is used directly to
# keep the result a (NaN) Float32. uy is accepted but does not enter the
# computation.
function code(ux, uy, maxCos)
    root_of_minus_one = NaN32
    return Float32(Float32(root_of_minus_one * ux) * maxCos)
end
function tmp = code(ux, uy, maxCos)
    % Evaluates (sqrt(-1) * ux) * maxCos in single precision, where the real
    % square root of -1 is represented as NaN. MATLAB's sqrt returns a complex
    % value for a negative input, which would make this function return a
    % complex number; single(NaN) keeps the result real.
    % uy is accepted but does not enter the computation.
    root_of_minus_one = single(NaN);
    tmp = (root_of_minus_one * ux) * maxCos;
end
\begin{array}{l}
\\
\left(\sqrt{-1} \cdot ux\right) \cdot maxCos
\end{array}
Initial program 57.7%
lift-*.f32N/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
unpow1N/A
metadata-evalN/A
sqrt-pow1N/A
pow2N/A
rem-sqrt-square-revN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
fabs-subN/A
Applied rewrites57.8%
Taylor expanded in ux around inf
*-commutativeN/A
lower-*.f32N/A
lower--.f32N/A
*-commutativeN/A
lower-*.f32N/A
lower-/.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
unpow2N/A
lower-*.f3298.8
Applied rewrites98.8%
Taylor expanded in uy around 0
lower-sqrt.f32N/A
lower--.f32N/A
lower-pow.f32N/A
lower--.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f3248.6
Applied rewrites45.9%
Taylor expanded in maxCos around inf
Applied rewrites-0.0%
herbie shell --seed 2024343
; Input benchmark, evaluated in binary32:
;   cos((uy * 2) * PI) * sqrt(1 - t * t), where t = (1 - ux) + ux * maxCos
; (t is written out twice in the body below).
(FPCore (ux uy maxCos)
:name "UniformSampleCone, x"
:precision binary32
; Precondition: 2.328306437e-10 <= ux <= 1, 2.328306437e-10 <= uy <= 1,
; and 0 <= maxCos <= 1.
:pre (and (and (and (<= 2.328306437e-10 ux) (<= ux 1.0)) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
(* (cos (* (* uy 2.0) (PI))) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))