
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (- (log (- 1.0 u1)))) (sin (* (* 2.0 PI) u2))))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(-logf((1.0f - u1))) * sinf(((2.0f * ((float) M_PI)) * u2));
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(-log(Float32(Float32(1.0) - u1)))) * sin(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt(-log((single(1.0) - u1))) * sin(((single(2.0) * single(pi)) * u2)); end
\begin{array}{l}
\\
\sqrt{-\log \left(1 - u1\right)} \cdot \sin \left(\left(2 \cdot \pi\right) \cdot u2\right)
\end{array}
Herbie found 13 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (- (log (- 1.0 u1)))) (sin (* (* 2.0 PI) u2))))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(-logf((1.0f - u1))) * sinf(((2.0f * ((float) M_PI)) * u2));
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(-log(Float32(Float32(1.0) - u1)))) * sin(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt(-log((single(1.0) - u1))) * sin(((single(2.0) * single(pi)) * u2)); end
\begin{array}{l}
\\
\sqrt{-\log \left(1 - u1\right)} \cdot \sin \left(\left(2 \cdot \pi\right) \cdot u2\right)
\end{array}
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (- (log1p (- u1)))) (sin (* (+ PI PI) u2))))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(-log1pf(-u1)) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(-log1p(Float32(-u1)))) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))) end
\begin{array}{l}
\\
\sqrt{-\mathsf{log1p}\left(-u1\right)} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)
\end{array}
Initial program 56.7%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3256.7
Applied rewrites56.7%
lift--.f32N/A
flip--N/A
lower-/.f32N/A
metadata-evalN/A
unpow2N/A
lower--.f32N/A
unpow2N/A
lower-*.f32N/A
lower-+.f3253.8
Applied rewrites53.8%
lift-log.f32N/A
lift-+.f32N/A
lift-/.f32N/A
lift--.f32N/A
lift-*.f32N/A
pow2N/A
metadata-evalN/A
pow2N/A
flip--N/A
*-rgt-identityN/A
*-commutativeN/A
metadata-evalN/A
fp-cancel-sign-sub-invN/A
mul-1-negN/A
lower-log1p.f32N/A
lower-neg.f3298.3
Applied rewrites98.3%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0001500000071246177)
(* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1)))))
(*
(sqrt (fma (* (fma (fma 0.25 u1 0.3333333333333333) u1 0.5) u1) u1 u1))
(sin (* (* 2.0 PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0001500000071246177f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf(fmaf((fmaf(fmaf(0.25f, u1, 0.3333333333333333f), u1, 0.5f) * u1), u1, u1)) * sinf(((2.0f * ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0001500000071246177)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(fma(Float32(fma(fma(Float32(0.25), u1, Float32(0.3333333333333333)), u1, Float32(0.5)) * u1), u1, u1)) * sin(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0001500000071246177:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(0.25, u1, 0.3333333333333333\right), u1, 0.5\right) \cdot u1, u1, u1\right)} \cdot \sin \left(\left(2 \cdot \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 1.50000007e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.5%
if 1.50000007e-4 < u2 Initial program 55.6%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.2
Applied rewrites93.2%
lift-*.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
distribute-lft-inN/A
lower-fma.f32N/A
lower-*.f32N/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
Applied rewrites93.2%
lift-fma.f32N/A
*-rgt-identityN/A
lift-*.f32N/A
lift-*.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
lift-*.f3293.2
Applied rewrites93.2%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0001500000071246177)
(* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1)))))
(*
(sqrt (* (fma (fma (fma 0.25 u1 0.3333333333333333) u1 0.5) u1 1.0) u1))
(sin (* (+ PI PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0001500000071246177f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf((fmaf(fmaf(fmaf(0.25f, u1, 0.3333333333333333f), u1, 0.5f), u1, 1.0f) * u1)) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0001500000071246177)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(Float32(fma(fma(fma(Float32(0.25), u1, Float32(0.3333333333333333)), u1, Float32(0.5)), u1, Float32(1.0)) * u1)) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0001500000071246177:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(0.25, u1, 0.3333333333333333\right), u1, 0.5\right), u1, 1\right) \cdot u1} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 1.50000007e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.5%
if 1.50000007e-4 < u2 Initial program 55.6%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.2
Applied rewrites93.2%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lift-+.f32N/A
lift-PI.f32N/A
lift-PI.f3293.2
Applied rewrites93.2%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0001500000071246177)
(* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1)))))
(*
(sqrt (fma (* (fma 0.3333333333333333 u1 0.5) u1) u1 u1))
(sin (* (* 2.0 PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0001500000071246177f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf(fmaf((fmaf(0.3333333333333333f, u1, 0.5f) * u1), u1, u1)) * sinf(((2.0f * ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0001500000071246177)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(fma(Float32(fma(Float32(0.3333333333333333), u1, Float32(0.5)) * u1), u1, u1)) * sin(Float32(Float32(Float32(2.0) * Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0001500000071246177:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(0.3333333333333333, u1, 0.5\right) \cdot u1, u1, u1\right)} \cdot \sin \left(\left(2 \cdot \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 1.50000007e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.5%
if 1.50000007e-4 < u2 Initial program 55.6%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.2
Applied rewrites93.2%
lift-*.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
lift-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
distribute-lft-inN/A
lower-fma.f32N/A
lower-*.f32N/A
*-commutativeN/A
+-commutativeN/A
*-commutativeN/A
+-commutativeN/A
Applied rewrites93.2%
Taylor expanded in u1 around 0
Applied rewrites91.6%
lift-fma.f32N/A
*-rgt-identityN/A
+-commutativeN/A
lift-*.f32N/A
*-commutativeN/A
lower-fma.f3291.6
Applied rewrites91.6%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0001500000071246177)
(* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1)))))
(*
(sqrt (* (fma (fma 0.3333333333333333 u1 0.5) u1 1.0) u1))
(sin (* (+ PI PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0001500000071246177f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf((fmaf(fmaf(0.3333333333333333f, u1, 0.5f), u1, 1.0f) * u1)) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0001500000071246177)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(Float32(fma(fma(Float32(0.3333333333333333), u1, Float32(0.5)), u1, Float32(1.0)) * u1)) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0001500000071246177:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(0.3333333333333333, u1, 0.5\right), u1, 1\right) \cdot u1} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 1.50000007e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.5%
if 1.50000007e-4 < u2 Initial program 55.6%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3255.6
Applied rewrites55.6%
lift--.f32N/A
flip--N/A
lower-/.f32N/A
metadata-evalN/A
unpow2N/A
lower--.f32N/A
unpow2N/A
lower-*.f32N/A
lower-+.f3252.6
Applied rewrites52.6%
lift-log.f32N/A
lift-+.f32N/A
lift-/.f32N/A
lift--.f32N/A
lift-*.f32N/A
pow2N/A
metadata-evalN/A
pow2N/A
flip--N/A
*-rgt-identityN/A
*-commutativeN/A
metadata-evalN/A
fp-cancel-sign-sub-invN/A
mul-1-negN/A
lower-log1p.f32N/A
lower-neg.f3298.0
Applied rewrites98.0%
Taylor expanded in u1 around 0
neg-logN/A
mul-1-negN/A
fp-cancel-sign-sub-invN/A
metadata-evalN/A
*-commutativeN/A
*-rgt-identityN/A
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3291.6
Applied rewrites91.6%
(FPCore (cosTheta_i u1 u2) :precision binary32 (if (<= u2 0.0002500000118743628) (* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1))))) (* (sqrt (* (fma 0.5 u1 1.0) u1)) (sin (* (+ PI PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0002500000118743628f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf((fmaf(0.5f, u1, 1.0f) * u1)) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0002500000118743628)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(Float32(fma(Float32(0.5), u1, Float32(1.0)) * u1)) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0002500000118743628:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(0.5, u1, 1\right) \cdot u1} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 2.50000012e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.3%
if 2.50000012e-4 < u2 Initial program 55.5%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
lower-fma.f3288.2
Applied rewrites88.2%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lift-+.f32N/A
lift-PI.f32N/A
lift-PI.f3288.2
Applied rewrites88.2%
(FPCore (cosTheta_i u1 u2) :precision binary32 (if (<= u2 0.0004400000034365803) (* (* (* PI 2.0) u2) (sqrt (- (log1p (- u1))))) (* (sqrt u1) (sin (* (+ PI PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0004400000034365803f) {
tmp = ((((float) M_PI) * 2.0f) * u2) * sqrtf(-log1pf(-u1));
} else {
tmp = sqrtf(u1) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0004400000034365803)) tmp = Float32(Float32(Float32(Float32(pi) * Float32(2.0)) * u2) * sqrt(Float32(-log1p(Float32(-u1))))); else tmp = Float32(sqrt(u1) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0004400000034365803:\\
\;\;\;\;\left(\left(\pi \cdot 2\right) \cdot u2\right) \cdot \sqrt{-\mathsf{log1p}\left(-u1\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{u1} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 4.40000003e-4Initial program 57.4%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lower-+.f32N/A
lift-PI.f32N/A
lift-PI.f3257.4
Applied rewrites57.4%
lift-neg.f32N/A
lift--.f32N/A
lift-log.f32N/A
neg-logN/A
lower-log.f32N/A
lower-/.f32N/A
lift--.f3255.1
Applied rewrites55.1%
Taylor expanded in u2 around 0
Applied rewrites98.0%
if 4.40000003e-4 < u2 Initial program 55.3%
Taylor expanded in u1 around 0
Applied rewrites77.6%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lift-+.f32N/A
lift-PI.f32N/A
lift-PI.f3277.6
Applied rewrites77.6%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0004400000034365803)
(*
(sqrt (* (fma (fma (fma 0.25 u1 0.3333333333333333) u1 0.5) u1 1.0) u1))
(* (* PI 2.0) u2))
(* (sqrt u1) (sin (* (+ PI PI) u2)))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0004400000034365803f) {
tmp = sqrtf((fmaf(fmaf(fmaf(0.25f, u1, 0.3333333333333333f), u1, 0.5f), u1, 1.0f) * u1)) * ((((float) M_PI) * 2.0f) * u2);
} else {
tmp = sqrtf(u1) * sinf(((((float) M_PI) + ((float) M_PI)) * u2));
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0004400000034365803)) tmp = Float32(sqrt(Float32(fma(fma(fma(Float32(0.25), u1, Float32(0.3333333333333333)), u1, Float32(0.5)), u1, Float32(1.0)) * u1)) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)); else tmp = Float32(sqrt(u1) * sin(Float32(Float32(Float32(pi) + Float32(pi)) * u2))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0004400000034365803:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(0.25, u1, 0.3333333333333333\right), u1, 0.5\right), u1, 1\right) \cdot u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)\\
\mathbf{else}:\\
\;\;\;\;\sqrt{u1} \cdot \sin \left(\left(\pi + \pi\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 4.40000003e-4Initial program 57.4%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.3
Applied rewrites93.3%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3292.9
Applied rewrites92.9%
if 4.40000003e-4 < u2 Initial program 55.3%
Taylor expanded in u1 around 0
Applied rewrites77.6%
lift-PI.f32N/A
lift-*.f32N/A
count-2-revN/A
lift-+.f32N/A
lift-PI.f32N/A
lift-PI.f3277.6
Applied rewrites77.6%
(FPCore (cosTheta_i u1 u2)
:precision binary32
(if (<= u2 0.0004400000034365803)
(*
(sqrt (* (fma (fma (fma 0.25 u1 0.3333333333333333) u1 0.5) u1 1.0) u1))
(* (* PI 2.0) u2))
(*
(sqrt u1)
(*
(fma (* -1.3333333333333333 (* u2 u2)) (* (* PI PI) PI) (* PI 2.0))
u2))))
float code(float cosTheta_i, float u1, float u2) {
float tmp;
if (u2 <= 0.0004400000034365803f) {
tmp = sqrtf((fmaf(fmaf(fmaf(0.25f, u1, 0.3333333333333333f), u1, 0.5f), u1, 1.0f) * u1)) * ((((float) M_PI) * 2.0f) * u2);
} else {
tmp = sqrtf(u1) * (fmaf((-1.3333333333333333f * (u2 * u2)), ((((float) M_PI) * ((float) M_PI)) * ((float) M_PI)), (((float) M_PI) * 2.0f)) * u2);
}
return tmp;
}
function code(cosTheta_i, u1, u2) tmp = Float32(0.0) if (u2 <= Float32(0.0004400000034365803)) tmp = Float32(sqrt(Float32(fma(fma(fma(Float32(0.25), u1, Float32(0.3333333333333333)), u1, Float32(0.5)), u1, Float32(1.0)) * u1)) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)); else tmp = Float32(sqrt(u1) * Float32(fma(Float32(Float32(-1.3333333333333333) * Float32(u2 * u2)), Float32(Float32(Float32(pi) * Float32(pi)) * Float32(pi)), Float32(Float32(pi) * Float32(2.0))) * u2)); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u2 \leq 0.0004400000034365803:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(0.25, u1, 0.3333333333333333\right), u1, 0.5\right), u1, 1\right) \cdot u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)\\
\mathbf{else}:\\
\;\;\;\;\sqrt{u1} \cdot \left(\mathsf{fma}\left(-1.3333333333333333 \cdot \left(u2 \cdot u2\right), \left(\pi \cdot \pi\right) \cdot \pi, \pi \cdot 2\right) \cdot u2\right)\\
\end{array}
\end{array}
if u2 < 4.40000003e-4Initial program 57.4%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.3
Applied rewrites93.3%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3292.9
Applied rewrites92.9%
if 4.40000003e-4 < u2 Initial program 55.3%
Taylor expanded in u1 around 0
Applied rewrites77.6%
Taylor expanded in u2 around 0
*-commutativeN/A
lower-*.f32N/A
associate-*r*N/A
lower-fma.f32N/A
lower-*.f32N/A
unpow2N/A
lower-*.f32N/A
lower-pow.f32N/A
lift-PI.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3259.7
Applied rewrites59.7%
lift-PI.f32N/A
lift-pow.f32N/A
unpow3N/A
lower-*.f32N/A
lower-*.f32N/A
lift-PI.f32N/A
lift-PI.f32N/A
lift-PI.f3259.7
Applied rewrites59.7%
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (* (fma (fma (fma 0.25 u1 0.3333333333333333) u1 0.5) u1 1.0) u1)) (* (* PI 2.0) u2)))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf((fmaf(fmaf(fmaf(0.25f, u1, 0.3333333333333333f), u1, 0.5f), u1, 1.0f) * u1)) * ((((float) M_PI) * 2.0f) * u2);
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(fma(fma(fma(Float32(0.25), u1, Float32(0.3333333333333333)), u1, Float32(0.5)), u1, Float32(1.0)) * u1)) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(0.25, u1, 0.3333333333333333\right), u1, 0.5\right), u1, 1\right) \cdot u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)
\end{array}
Initial program 56.7%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f32N/A
+-commutativeN/A
lower-fma.f3293.3
Applied rewrites93.3%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3277.6
Applied rewrites77.6%
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (+ u1 (* (* 0.5 u1) u1))) (* (* PI 2.0) u2)))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf((u1 + ((0.5f * u1) * u1))) * ((((float) M_PI) * 2.0f) * u2);
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(u1 + Float32(Float32(Float32(0.5) * u1) * u1))) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt((u1 + ((single(0.5) * u1) * u1))) * ((single(pi) * single(2.0)) * u2); end
\begin{array}{l}
\\
\sqrt{u1 + \left(0.5 \cdot u1\right) \cdot u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)
\end{array}
Initial program 56.7%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
lower-fma.f3288.1
Applied rewrites88.1%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3273.9
Applied rewrites73.9%
lift-*.f32N/A
lift-fma.f32N/A
*-commutativeN/A
+-commutativeN/A
distribute-rgt-inN/A
*-commutativeN/A
*-rgt-identityN/A
lower-+.f32N/A
lower-*.f32N/A
lower-*.f3274.0
Applied rewrites74.0%
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt (* (fma 0.5 u1 1.0) u1)) (* (* PI 2.0) u2)))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf((fmaf(0.5f, u1, 1.0f) * u1)) * ((((float) M_PI) * 2.0f) * u2);
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(Float32(fma(Float32(0.5), u1, Float32(1.0)) * u1)) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)) end
\begin{array}{l}
\\
\sqrt{\mathsf{fma}\left(0.5, u1, 1\right) \cdot u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)
\end{array}
Initial program 56.7%
Taylor expanded in u1 around 0
*-commutativeN/A
lower-*.f32N/A
+-commutativeN/A
lower-fma.f3288.1
Applied rewrites88.1%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3273.9
Applied rewrites73.9%
(FPCore (cosTheta_i u1 u2) :precision binary32 (* (sqrt u1) (* (* PI 2.0) u2)))
float code(float cosTheta_i, float u1, float u2) {
return sqrtf(u1) * ((((float) M_PI) * 2.0f) * u2);
}
function code(cosTheta_i, u1, u2) return Float32(sqrt(u1) * Float32(Float32(Float32(pi) * Float32(2.0)) * u2)) end
function tmp = code(cosTheta_i, u1, u2) tmp = sqrt(u1) * ((single(pi) * single(2.0)) * u2); end
\begin{array}{l}
\\
\sqrt{u1} \cdot \left(\left(\pi \cdot 2\right) \cdot u2\right)
\end{array}
Initial program 56.7%
Taylor expanded in u1 around 0
Applied rewrites77.1%
Taylor expanded in u2 around 0
*-commutativeN/A
associate-*l*N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f32N/A
lift-PI.f3266.2
Applied rewrites66.2%
herbie shell --seed 2025105
(FPCore (cosTheta_i u1 u2)
:name "Beckmann Sample, near normal, slope_y"
:precision binary32
:pre (and (and (and (> cosTheta_i 0.9999) (<= cosTheta_i 1.0)) (and (<= 2.328306437e-10 u1) (<= u1 1.0))) (and (<= 2.328306437e-10 u2) (<= u2 1.0)))
(* (sqrt (- (log (- 1.0 u1)))) (sin (* (* 2.0 PI) u2))))