
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) PI)) (sqrt (- 1.0 (* t_0 t_0))))))
float code(float ux, float uy, float maxCos) {
float t_0 = (1.0f - ux) + (ux * maxCos);
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((1.0f - (t_0 * t_0)));
}
function code(ux, uy, maxCos) t_0 = Float32(Float32(Float32(1.0) - ux) + Float32(ux * maxCos)) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))) end
function tmp = code(ux, uy, maxCos) t_0 = (single(1.0) - ux) + (ux * maxCos); tmp = cos(((uy * single(2.0)) * single(pi))) * sqrt((single(1.0) - (t_0 * t_0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 19 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (ux uy maxCos) :precision binary32 (let* ((t_0 (+ (- 1.0 ux) (* ux maxCos)))) (* (cos (* (* uy 2.0) PI)) (sqrt (- 1.0 (* t_0 t_0))))))
float code(float ux, float uy, float maxCos) {
float t_0 = (1.0f - ux) + (ux * maxCos);
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((1.0f - (t_0 * t_0)));
}
function code(ux, uy, maxCos) t_0 = Float32(Float32(Float32(1.0) - ux) + Float32(ux * maxCos)) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(Float32(1.0) - Float32(t_0 * t_0)))) end
function tmp = code(ux, uy, maxCos) t_0 = (single(1.0) - ux) + (ux * maxCos); tmp = cos(((uy * single(2.0)) * single(pi))) * sqrt((single(1.0) - (t_0 * t_0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \left(1 - ux\right) + ux \cdot maxCos\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{1 - t\_0 \cdot t\_0}
\end{array}
\end{array}
(FPCore (ux uy maxCos)
:precision binary32
(*
(cos (* (* uy 2.0) PI))
(sqrt
(fma
(fma ux (* (+ maxCos -1.0) (- 1.0 maxCos)) (* maxCos -2.0))
ux
(* 2.0 ux)))))
float code(float ux, float uy, float maxCos) {
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf(fmaf(fmaf(ux, ((maxCos + -1.0f) * (1.0f - maxCos)), (maxCos * -2.0f)), ux, (2.0f * ux)));
}
function code(ux, uy, maxCos) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(fma(fma(ux, Float32(Float32(maxCos + Float32(-1.0)) * Float32(Float32(1.0) - maxCos)), Float32(maxCos * Float32(-2.0))), ux, Float32(Float32(2.0) * ux)))) end
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{\mathsf{fma}\left(\mathsf{fma}\left(ux, \left(maxCos + -1\right) \cdot \left(1 - maxCos\right), maxCos \cdot -2\right), ux, 2 \cdot ux\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
associate-+r+N/A
distribute-rgt-inN/A
accelerator-lowering-fma.f32N/A
accelerator-lowering-fma.f32N/A
sub-negN/A
metadata-evalN/A
neg-mul-1N/A
distribute-lft-inN/A
+-commutativeN/A
*-lowering-*.f32N/A
+-lowering-+.f32N/A
+-commutativeN/A
distribute-lft-inN/A
metadata-evalN/A
neg-mul-1N/A
sub-negN/A
--lowering--.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f3298.9
Applied egg-rr98.9%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0
(sqrt
(*
ux
(+
(fma -2.0 maxCos 2.0)
(* (+ maxCos -1.0) (fma (- maxCos) ux ux)))))))
(if (<= (cos (* (* uy 2.0) PI)) 0.9991999864578247)
(* (sqrt ux) (* (sqrt (- 2.0 ux)) (cos (* 2.0 (* uy PI)))))
(fma -2.0 (* t_0 (* (* uy uy) (* PI PI))) t_0))))
float code(float ux, float uy, float maxCos) {
float t_0 = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
float tmp;
if (cosf(((uy * 2.0f) * ((float) M_PI))) <= 0.9991999864578247f) {
tmp = sqrtf(ux) * (sqrtf((2.0f - ux)) * cosf((2.0f * (uy * ((float) M_PI)))));
} else {
tmp = fmaf(-2.0f, (t_0 * ((uy * uy) * (((float) M_PI) * ((float) M_PI)))), t_0);
}
return tmp;
}
function code(ux, uy, maxCos) t_0 = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))) tmp = Float32(0.0) if (cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) <= Float32(0.9991999864578247)) tmp = Float32(sqrt(ux) * Float32(sqrt(Float32(Float32(2.0) - ux)) * cos(Float32(Float32(2.0) * Float32(uy * Float32(pi)))))); else tmp = fma(Float32(-2.0), Float32(t_0 * Float32(Float32(uy * uy) * Float32(Float32(pi) * Float32(pi)))), t_0); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\mathbf{if}\;\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \leq 0.9991999864578247:\\
\;\;\;\;\sqrt{ux} \cdot \left(\sqrt{2 - ux} \cdot \cos \left(2 \cdot \left(uy \cdot \pi\right)\right)\right)\\
\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(-2, t\_0 \cdot \left(\left(uy \cdot uy\right) \cdot \left(\pi \cdot \pi\right)\right), t\_0\right)\\
\end{array}
\end{array}
if (cos.f32 (*.f32 (*.f32 uy #s(literal 2 binary32)) (PI.f32))) < 0.999199986Initial program 56.3%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified97.6%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3291.6
Simplified91.6%
pow1/2N/A
unpow-prod-downN/A
associate-*r*N/A
*-commutativeN/A
add-sqr-sqrtN/A
associate-*l*N/A
associate-*l*N/A
*-lowering-*.f32N/A
pow1/2N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
pow1/2N/A
sqrt-lowering-sqrt.f32N/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
associate-*l*N/A
add-sqr-sqrtN/A
Applied egg-rr91.9%
if 0.999199986 < (cos.f32 (*.f32 (*.f32 uy #s(literal 2 binary32)) (PI.f32))) Initial program 54.4%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified99.2%
Taylor expanded in uy around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
Simplified99.2%
Final simplification97.7%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) PI)) (sqrt (* ux (fma ux (* (+ maxCos -1.0) (- 1.0 maxCos)) (fma maxCos -2.0 2.0))))))
float code(float ux, float uy, float maxCos) {
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((ux * fmaf(ux, ((maxCos + -1.0f) * (1.0f - maxCos)), fmaf(maxCos, -2.0f, 2.0f))));
}
function code(ux, uy, maxCos) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(ux * fma(ux, Float32(Float32(maxCos + Float32(-1.0)) * Float32(Float32(1.0) - maxCos)), fma(maxCos, Float32(-2.0), Float32(2.0)))))) end
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{ux \cdot \mathsf{fma}\left(ux, \left(maxCos + -1\right) \cdot \left(1 - maxCos\right), \mathsf{fma}\left(maxCos, -2, 2\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) PI)) (sqrt (fma ux (- 2.0 ux) (* (* ux maxCos) (fma 2.0 ux -2.0))))))
float code(float ux, float uy, float maxCos) {
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf(fmaf(ux, (2.0f - ux), ((ux * maxCos) * fmaf(2.0f, ux, -2.0f))));
}
function code(ux, uy, maxCos) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(fma(ux, Float32(Float32(2.0) - ux), Float32(Float32(ux * maxCos) * fma(Float32(2.0), ux, Float32(-2.0)))))) end
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{\mathsf{fma}\left(ux, 2 - ux, \left(ux \cdot maxCos\right) \cdot \mathsf{fma}\left(2, ux, -2\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
associate-*r*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
accelerator-lowering-fma.f3298.2
Simplified98.2%
Final simplification98.2%
(FPCore (ux uy maxCos) :precision binary32 (* (cos (* (* uy 2.0) PI)) (sqrt (fma (- maxCos) (* 2.0 ux) (- (* ux (+ ux -2.0)))))))
float code(float ux, float uy, float maxCos) {
return cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf(fmaf(-maxCos, (2.0f * ux), -(ux * (ux + -2.0f))));
}
function code(ux, uy, maxCos) return Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(fma(Float32(-maxCos), Float32(Float32(2.0) * ux), Float32(-Float32(ux * Float32(ux + Float32(-2.0))))))) end
\begin{array}{l}
\\
\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{\mathsf{fma}\left(-maxCos, 2 \cdot ux, -ux \cdot \left(ux + -2\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
+-commutativeN/A
associate--l+N/A
accelerator-lowering-fma.f32N/A
unpow2N/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
sub-negN/A
metadata-evalN/A
accelerator-lowering-fma.f3258.6
Simplified58.6%
Taylor expanded in maxCos around 0
sub-negN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
*-lowering-*.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
associate-*r*N/A
*-lowering-*.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f3298.2
Simplified98.2%
Taylor expanded in ux around 0
*-commutativeN/A
*-lowering-*.f3297.3
Simplified97.3%
Final simplification97.3%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0
(sqrt
(*
ux
(+
(fma -2.0 maxCos 2.0)
(* (+ maxCos -1.0) (fma (- maxCos) ux ux)))))))
(if (<= (* uy 2.0) 0.012000000104308128)
(fma -2.0 (* t_0 (* (* uy uy) (* PI PI))) t_0)
(* (cos (* 2.0 (* uy PI))) (sqrt (* ux (- 2.0 ux)))))))
float code(float ux, float uy, float maxCos) {
float t_0 = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
float tmp;
if ((uy * 2.0f) <= 0.012000000104308128f) {
tmp = fmaf(-2.0f, (t_0 * ((uy * uy) * (((float) M_PI) * ((float) M_PI)))), t_0);
} else {
tmp = cosf((2.0f * (uy * ((float) M_PI)))) * sqrtf((ux * (2.0f - ux)));
}
return tmp;
}
function code(ux, uy, maxCos) t_0 = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))) tmp = Float32(0.0) if (Float32(uy * Float32(2.0)) <= Float32(0.012000000104308128)) tmp = fma(Float32(-2.0), Float32(t_0 * Float32(Float32(uy * uy) * Float32(Float32(pi) * Float32(pi)))), t_0); else tmp = Float32(cos(Float32(Float32(2.0) * Float32(uy * Float32(pi)))) * sqrt(Float32(ux * Float32(Float32(2.0) - ux)))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\mathbf{if}\;uy \cdot 2 \leq 0.012000000104308128:\\
\;\;\;\;\mathsf{fma}\left(-2, t\_0 \cdot \left(\left(uy \cdot uy\right) \cdot \left(\pi \cdot \pi\right)\right), t\_0\right)\\
\mathbf{else}:\\
\;\;\;\;\cos \left(2 \cdot \left(uy \cdot \pi\right)\right) \cdot \sqrt{ux \cdot \left(2 - ux\right)}\\
\end{array}
\end{array}
if (*.f32 uy #s(literal 2 binary32)) < 0.0120000001Initial program 54.4%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified99.2%
Taylor expanded in uy around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
Simplified99.2%
if 0.0120000001 < (*.f32 uy #s(literal 2 binary32)) Initial program 56.3%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified97.6%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3291.6
Simplified91.6%
Final simplification97.7%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0
(sqrt
(*
ux
(+
(fma -2.0 maxCos 2.0)
(* (+ maxCos -1.0) (fma (- maxCos) ux ux)))))))
(if (<= (* uy 2.0) 0.10000000149011612)
(fma -2.0 (* t_0 (* (* uy uy) (* PI PI))) t_0)
(* (cos (* (* uy 2.0) PI)) (sqrt (* 2.0 ux))))))
float code(float ux, float uy, float maxCos) {
float t_0 = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
float tmp;
if ((uy * 2.0f) <= 0.10000000149011612f) {
tmp = fmaf(-2.0f, (t_0 * ((uy * uy) * (((float) M_PI) * ((float) M_PI)))), t_0);
} else {
tmp = cosf(((uy * 2.0f) * ((float) M_PI))) * sqrtf((2.0f * ux));
}
return tmp;
}
function code(ux, uy, maxCos) t_0 = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))) tmp = Float32(0.0) if (Float32(uy * Float32(2.0)) <= Float32(0.10000000149011612)) tmp = fma(Float32(-2.0), Float32(t_0 * Float32(Float32(uy * uy) * Float32(Float32(pi) * Float32(pi)))), t_0); else tmp = Float32(cos(Float32(Float32(uy * Float32(2.0)) * Float32(pi))) * sqrt(Float32(Float32(2.0) * ux))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\mathbf{if}\;uy \cdot 2 \leq 0.10000000149011612:\\
\;\;\;\;\mathsf{fma}\left(-2, t\_0 \cdot \left(\left(uy \cdot uy\right) \cdot \left(\pi \cdot \pi\right)\right), t\_0\right)\\
\mathbf{else}:\\
\;\;\;\;\cos \left(\left(uy \cdot 2\right) \cdot \pi\right) \cdot \sqrt{2 \cdot ux}\\
\end{array}
\end{array}
if (*.f32 uy #s(literal 2 binary32)) < 0.100000001Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified99.2%
Taylor expanded in uy around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
Simplified97.7%
if 0.100000001 < (*.f32 uy #s(literal 2 binary32)) Initial program 54.4%
Taylor expanded in maxCos around 0
sub-negN/A
+-commutativeN/A
unpow2N/A
distribute-rgt-neg-inN/A
mul-1-negN/A
accelerator-lowering-fma.f32N/A
--lowering--.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
--lowering--.f3253.4
Simplified53.4%
Taylor expanded in ux around 0
*-lowering-*.f3273.8
Simplified73.8%
Final simplification94.1%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0
(sqrt
(*
ux
(+
(fma -2.0 maxCos 2.0)
(* (+ maxCos -1.0) (fma (- maxCos) ux ux)))))))
(fma -2.0 (* t_0 (* (* uy uy) (* PI PI))) t_0)))
float code(float ux, float uy, float maxCos) {
float t_0 = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
return fmaf(-2.0f, (t_0 * ((uy * uy) * (((float) M_PI) * ((float) M_PI)))), t_0);
}
function code(ux, uy, maxCos) t_0 = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))) return fma(Float32(-2.0), Float32(t_0 * Float32(Float32(uy * uy) * Float32(Float32(pi) * Float32(pi)))), t_0) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\mathsf{fma}\left(-2, t\_0 \cdot \left(\left(uy \cdot uy\right) \cdot \left(\pi \cdot \pi\right)\right), t\_0\right)
\end{array}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in uy around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
Simplified87.4%
Final simplification87.4%
(FPCore (ux uy maxCos)
:precision binary32
(*
(sqrt
(fma
(fma ux (* (+ maxCos -1.0) (- 1.0 maxCos)) (* maxCos -2.0))
ux
(* 2.0 ux)))
(fma (* -2.0 (* uy uy)) (* PI PI) 1.0)))
float code(float ux, float uy, float maxCos) {
return sqrtf(fmaf(fmaf(ux, ((maxCos + -1.0f) * (1.0f - maxCos)), (maxCos * -2.0f)), ux, (2.0f * ux))) * fmaf((-2.0f * (uy * uy)), (((float) M_PI) * ((float) M_PI)), 1.0f);
}
function code(ux, uy, maxCos) return Float32(sqrt(fma(fma(ux, Float32(Float32(maxCos + Float32(-1.0)) * Float32(Float32(1.0) - maxCos)), Float32(maxCos * Float32(-2.0))), ux, Float32(Float32(2.0) * ux))) * fma(Float32(Float32(-2.0) * Float32(uy * uy)), Float32(Float32(pi) * Float32(pi)), Float32(1.0))) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(ux, \left(maxCos + -1\right) \cdot \left(1 - maxCos\right), maxCos \cdot -2\right), ux, 2 \cdot ux\right)} \cdot \mathsf{fma}\left(-2 \cdot \left(uy \cdot uy\right), \pi \cdot \pi, 1\right)
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
associate-+r+N/A
distribute-rgt-inN/A
accelerator-lowering-fma.f32N/A
accelerator-lowering-fma.f32N/A
sub-negN/A
metadata-evalN/A
neg-mul-1N/A
distribute-lft-inN/A
+-commutativeN/A
*-lowering-*.f32N/A
+-lowering-+.f32N/A
+-commutativeN/A
distribute-lft-inN/A
metadata-evalN/A
neg-mul-1N/A
sub-negN/A
--lowering--.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f3298.9
Applied egg-rr98.9%
Taylor expanded in uy around 0
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f3287.3
Simplified87.3%
Final simplification87.3%
(FPCore (ux uy maxCos)
:precision binary32
(let* ((t_0 (sqrt (* ux (- 2.0 ux)))))
(if (<= maxCos 4.999999987376214e-7)
(fma -2.0 (* (* (* uy uy) (* PI PI)) t_0) t_0)
(sqrt
(*
ux
(+
(fma -2.0 maxCos 2.0)
(* (+ maxCos -1.0) (fma (- maxCos) ux ux))))))))
float code(float ux, float uy, float maxCos) {
float t_0 = sqrtf((ux * (2.0f - ux)));
float tmp;
if (maxCos <= 4.999999987376214e-7f) {
tmp = fmaf(-2.0f, (((uy * uy) * (((float) M_PI) * ((float) M_PI))) * t_0), t_0);
} else {
tmp = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
}
return tmp;
}
function code(ux, uy, maxCos) t_0 = sqrt(Float32(ux * Float32(Float32(2.0) - ux))) tmp = Float32(0.0) if (maxCos <= Float32(4.999999987376214e-7)) tmp = fma(Float32(-2.0), Float32(Float32(Float32(uy * uy) * Float32(Float32(pi) * Float32(pi))) * t_0), t_0); else tmp = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt{ux \cdot \left(2 - ux\right)}\\
\mathbf{if}\;maxCos \leq 4.999999987376214 \cdot 10^{-7}:\\
\;\;\;\;\mathsf{fma}\left(-2, \left(\left(uy \cdot uy\right) \cdot \left(\pi \cdot \pi\right)\right) \cdot t\_0, t\_0\right)\\
\mathbf{else}:\\
\;\;\;\;\sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\end{array}
\end{array}
if maxCos < 4.99999999e-7Initial program 53.7%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3298.8
Simplified98.8%
Taylor expanded in uy around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
Simplified87.8%
if 4.99999999e-7 < maxCos Initial program 59.6%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
associate-+r+N/A
+-lowering-+.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
associate-*r*N/A
sub-negN/A
mul-1-negN/A
*-lowering-*.f32N/A
distribute-rgt-inN/A
*-lft-identityN/A
associate-*r*N/A
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f3277.2
Simplified77.2%
Final simplification85.9%
(FPCore (ux uy maxCos) :precision binary32 (* (sqrt (* ux (fma ux (* (+ maxCos -1.0) (- 1.0 maxCos)) (fma maxCos -2.0 2.0)))) (fma (* -2.0 (* uy uy)) (* PI PI) 1.0)))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * fmaf(ux, ((maxCos + -1.0f) * (1.0f - maxCos)), fmaf(maxCos, -2.0f, 2.0f)))) * fmaf((-2.0f * (uy * uy)), (((float) M_PI) * ((float) M_PI)), 1.0f);
}
function code(ux, uy, maxCos) return Float32(sqrt(Float32(ux * fma(ux, Float32(Float32(maxCos + Float32(-1.0)) * Float32(Float32(1.0) - maxCos)), fma(maxCos, Float32(-2.0), Float32(2.0))))) * fma(Float32(Float32(-2.0) * Float32(uy * uy)), Float32(Float32(pi) * Float32(pi)), Float32(1.0))) end
\begin{array}{l}
\\
\sqrt{ux \cdot \mathsf{fma}\left(ux, \left(maxCos + -1\right) \cdot \left(1 - maxCos\right), \mathsf{fma}\left(maxCos, -2, 2\right)\right)} \cdot \mathsf{fma}\left(-2 \cdot \left(uy \cdot uy\right), \pi \cdot \pi, 1\right)
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in uy around 0
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f3287.3
Simplified87.3%
Final simplification87.3%
(FPCore (ux uy maxCos)
:precision binary32
(if (<= maxCos 4.999999987376214e-7)
(* (sqrt (* ux (- 2.0 ux))) (fma (* -2.0 (* uy uy)) (* PI PI) 1.0))
(sqrt
(*
ux
(+ (fma -2.0 maxCos 2.0) (* (+ maxCos -1.0) (fma (- maxCos) ux ux)))))))
float code(float ux, float uy, float maxCos) {
float tmp;
if (maxCos <= 4.999999987376214e-7f) {
tmp = sqrtf((ux * (2.0f - ux))) * fmaf((-2.0f * (uy * uy)), (((float) M_PI) * ((float) M_PI)), 1.0f);
} else {
tmp = sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
}
return tmp;
}
function code(ux, uy, maxCos) tmp = Float32(0.0) if (maxCos <= Float32(4.999999987376214e-7)) tmp = Float32(sqrt(Float32(ux * Float32(Float32(2.0) - ux))) * fma(Float32(Float32(-2.0) * Float32(uy * uy)), Float32(Float32(pi) * Float32(pi)), Float32(1.0))); else tmp = sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;maxCos \leq 4.999999987376214 \cdot 10^{-7}:\\
\;\;\;\;\sqrt{ux \cdot \left(2 - ux\right)} \cdot \mathsf{fma}\left(-2 \cdot \left(uy \cdot uy\right), \pi \cdot \pi, 1\right)\\
\mathbf{else}:\\
\;\;\;\;\sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}\\
\end{array}
\end{array}
if maxCos < 4.99999999e-7Initial program 53.7%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3298.8
Simplified98.8%
Taylor expanded in uy around 0
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
unpow2N/A
*-lowering-*.f32N/A
PI-lowering-PI.f32N/A
PI-lowering-PI.f3287.7
Simplified87.7%
if 4.99999999e-7 < maxCos Initial program 59.6%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
associate-+r+N/A
+-lowering-+.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
associate-*r*N/A
sub-negN/A
mul-1-negN/A
*-lowering-*.f32N/A
distribute-rgt-inN/A
*-lft-identityN/A
associate-*r*N/A
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f3277.2
Simplified77.2%
Final simplification85.8%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (* ux (+ (fma -2.0 maxCos 2.0) (* (+ maxCos -1.0) (fma (- maxCos) ux ux))))))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * (fmaf(-2.0f, maxCos, 2.0f) + ((maxCos + -1.0f) * fmaf(-maxCos, ux, ux)))));
}
function code(ux, uy, maxCos) return sqrt(Float32(ux * Float32(fma(Float32(-2.0), maxCos, Float32(2.0)) + Float32(Float32(maxCos + Float32(-1.0)) * fma(Float32(-maxCos), ux, ux))))) end
\begin{array}{l}
\\
\sqrt{ux \cdot \left(\mathsf{fma}\left(-2, maxCos, 2\right) + \left(maxCos + -1\right) \cdot \mathsf{fma}\left(-maxCos, ux, ux\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
associate-+r+N/A
+-lowering-+.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
associate-*r*N/A
sub-negN/A
mul-1-negN/A
*-lowering-*.f32N/A
distribute-rgt-inN/A
*-lft-identityN/A
associate-*r*N/A
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f3279.2
Simplified79.2%
Final simplification79.2%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (fma (- ux) (+ ux -2.0) (* maxCos (* (- ux) (fma ux -2.0 2.0))))))
float code(float ux, float uy, float maxCos) {
return sqrtf(fmaf(-ux, (ux + -2.0f), (maxCos * (-ux * fmaf(ux, -2.0f, 2.0f)))));
}
function code(ux, uy, maxCos) return sqrt(fma(Float32(-ux), Float32(ux + Float32(-2.0)), Float32(maxCos * Float32(Float32(-ux) * fma(ux, Float32(-2.0), Float32(2.0)))))) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(-ux, ux + -2, maxCos \cdot \left(\left(-ux\right) \cdot \mathsf{fma}\left(ux, -2, 2\right)\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
+-commutativeN/A
associate--l+N/A
accelerator-lowering-fma.f32N/A
unpow2N/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
sub-negN/A
metadata-evalN/A
accelerator-lowering-fma.f3258.6
Simplified58.6%
Taylor expanded in maxCos around 0
sub-negN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
*-lowering-*.f32N/A
+-commutativeN/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
associate-*r*N/A
*-lowering-*.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f3298.2
Simplified98.2%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
+-commutativeN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
associate-*r*N/A
*-lowering-*.f32N/A
mul-1-negN/A
neg-lowering-neg.f32N/A
*-lowering-*.f32N/A
+-commutativeN/A
*-commutativeN/A
accelerator-lowering-fma.f3278.6
Simplified78.6%
Final simplification78.6%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (* ux (+ 2.0 (fma ux (* (+ maxCos -1.0) (- 1.0 maxCos)) (- maxCos))))))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * (2.0f + fmaf(ux, ((maxCos + -1.0f) * (1.0f - maxCos)), -maxCos))));
}
function code(ux, uy, maxCos) return sqrt(Float32(ux * Float32(Float32(2.0) + fma(ux, Float32(Float32(maxCos + Float32(-1.0)) * Float32(Float32(1.0) - maxCos)), Float32(-maxCos))))) end
\begin{array}{l}
\\
\sqrt{ux \cdot \left(2 + \mathsf{fma}\left(ux, \left(maxCos + -1\right) \cdot \left(1 - maxCos\right), -maxCos\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
sub-negN/A
+-commutativeN/A
unpow2N/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
Simplified46.7%
+-commutativeN/A
distribute-rgt-inN/A
associate-+r+N/A
+-lowering-+.f32N/A
Applied egg-rr46.9%
Taylor expanded in maxCos around 0
sub-negN/A
metadata-evalN/A
+-lowering-+.f3245.3
Simplified45.3%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
+-lowering-+.f32N/A
+-commutativeN/A
associate-*r*N/A
mul-1-negN/A
sub-negN/A
associate-*r*N/A
accelerator-lowering-fma.f32N/A
*-lowering-*.f32N/A
--lowering--.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
neg-lowering-neg.f3275.7
Simplified75.7%
Final simplification75.7%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (fma ux 2.0 (* ux (- ux)))))
float code(float ux, float uy, float maxCos) {
return sqrtf(fmaf(ux, 2.0f, (ux * -ux)));
}
function code(ux, uy, maxCos) return sqrt(fma(ux, Float32(2.0), Float32(ux * Float32(-ux)))) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(ux, 2, ux \cdot \left(-ux\right)\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3293.0
Simplified93.0%
Taylor expanded in uy around 0
sub-negN/A
mul-1-negN/A
+-commutativeN/A
distribute-rgt-inN/A
mul-1-negN/A
distribute-lft-neg-inN/A
unpow2N/A
mul-1-negN/A
sqrt-lowering-sqrt.f32N/A
+-commutativeN/A
mul-1-negN/A
unpow2N/A
distribute-lft-neg-inN/A
mul-1-negN/A
distribute-rgt-inN/A
*-lowering-*.f32N/A
mul-1-negN/A
sub-negN/A
--lowering--.f3275.4
Simplified75.4%
sub-negN/A
distribute-rgt-inN/A
*-commutativeN/A
accelerator-lowering-fma.f32N/A
distribute-lft-neg-outN/A
neg-lowering-neg.f32N/A
*-lowering-*.f3275.5
Applied egg-rr75.5%
Final simplification75.5%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (fma ux (- 1.0 ux) ux)))
float code(float ux, float uy, float maxCos) {
return sqrtf(fmaf(ux, (1.0f - ux), ux));
}
function code(ux, uy, maxCos) return sqrt(fma(ux, Float32(Float32(1.0) - ux), ux)) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(ux, 1 - ux, ux\right)}
\end{array}
Initial program 54.8%
Taylor expanded in uy around 0
sqrt-lowering-sqrt.f32N/A
sub-negN/A
+-commutativeN/A
unpow2N/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
Simplified46.7%
+-commutativeN/A
distribute-rgt-inN/A
associate-+r+N/A
+-lowering-+.f32N/A
Applied egg-rr46.9%
Taylor expanded in maxCos around 0
+-commutativeN/A
accelerator-lowering-fma.f32N/A
--lowering--.f3275.4
Simplified75.4%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (* ux (- 2.0 ux))))
float code(float ux, float uy, float maxCos) {
return sqrtf((ux * (2.0f - ux)));
}
real(4) function code(ux, uy, maxcos)
real(4), intent (in) :: ux
real(4), intent (in) :: uy
real(4), intent (in) :: maxcos
code = sqrt((ux * (2.0e0 - ux)))
end function
function code(ux, uy, maxCos) return sqrt(Float32(ux * Float32(Float32(2.0) - ux))) end
function tmp = code(ux, uy, maxCos) tmp = sqrt((ux * (single(2.0) - ux))); end
\begin{array}{l}
\\
\sqrt{ux \cdot \left(2 - ux\right)}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3293.0
Simplified93.0%
Taylor expanded in uy around 0
sub-negN/A
mul-1-negN/A
+-commutativeN/A
distribute-rgt-inN/A
mul-1-negN/A
distribute-lft-neg-inN/A
unpow2N/A
mul-1-negN/A
sqrt-lowering-sqrt.f32N/A
+-commutativeN/A
mul-1-negN/A
unpow2N/A
distribute-lft-neg-inN/A
mul-1-negN/A
distribute-rgt-inN/A
*-lowering-*.f32N/A
mul-1-negN/A
sub-negN/A
--lowering--.f3275.4
Simplified75.4%
(FPCore (ux uy maxCos) :precision binary32 (sqrt (* 2.0 ux)))
float code(float ux, float uy, float maxCos) {
return sqrtf((2.0f * ux));
}
real(4) function code(ux, uy, maxcos)
real(4), intent (in) :: ux
real(4), intent (in) :: uy
real(4), intent (in) :: maxcos
code = sqrt((2.0e0 * ux))
end function
function code(ux, uy, maxCos) return sqrt(Float32(Float32(2.0) * ux)) end
function tmp = code(ux, uy, maxCos) tmp = sqrt((single(2.0) * ux)); end
\begin{array}{l}
\\
\sqrt{2 \cdot ux}
\end{array}
Initial program 54.8%
Taylor expanded in ux around 0
*-lowering-*.f32N/A
cancel-sign-sub-invN/A
+-commutativeN/A
metadata-evalN/A
associate-+l+N/A
mul-1-negN/A
distribute-rgt-neg-inN/A
accelerator-lowering-fma.f32N/A
unpow2N/A
distribute-rgt-neg-inN/A
neg-sub0N/A
associate-+l-N/A
neg-sub0N/A
mul-1-negN/A
+-commutativeN/A
*-lowering-*.f32N/A
sub-negN/A
metadata-evalN/A
+-lowering-+.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
Simplified98.9%
Taylor expanded in maxCos around 0
*-lowering-*.f32N/A
sqrt-lowering-sqrt.f32N/A
*-lowering-*.f32N/A
mul-1-negN/A
unsub-negN/A
--lowering--.f32N/A
cos-lowering-cos.f32N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
PI-lowering-PI.f3293.0
Simplified93.0%
Taylor expanded in uy around 0
sub-negN/A
mul-1-negN/A
+-commutativeN/A
distribute-rgt-inN/A
mul-1-negN/A
distribute-lft-neg-inN/A
unpow2N/A
mul-1-negN/A
sqrt-lowering-sqrt.f32N/A
+-commutativeN/A
mul-1-negN/A
unpow2N/A
distribute-lft-neg-inN/A
mul-1-negN/A
distribute-rgt-inN/A
*-lowering-*.f32N/A
mul-1-negN/A
sub-negN/A
--lowering--.f3275.4
Simplified75.4%
Taylor expanded in ux around 0
*-commutativeN/A
*-lowering-*.f3263.8
Simplified63.8%
Final simplification63.8%
herbie shell --seed 2024199
(FPCore (ux uy maxCos)
:name "UniformSampleCone, x"
:precision binary32
:pre (and (and (and (<= 2.328306437e-10 ux) (<= ux 1.0)) (and (<= 2.328306437e-10 uy) (<= uy 1.0))) (and (<= 0.0 maxCos) (<= maxCos 1.0)))
(* (cos (* (* uy 2.0) PI)) (sqrt (- 1.0 (* (+ (- 1.0 ux) (* ux maxCos)) (+ (- 1.0 ux) (* ux maxCos)))))))