
(FPCore (alpha u0) :precision binary32 (* (* (- alpha) alpha) (log (- 1.0 u0))))
float code(float alpha, float u0) {
return (-alpha * alpha) * logf((1.0f - u0));
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (-alpha * alpha) * log((1.0e0 - u0))
end function
function code(alpha, u0) return Float32(Float32(Float32(-alpha) * alpha) * log(Float32(Float32(1.0) - u0))) end
function tmp = code(alpha, u0) tmp = (-alpha * alpha) * log((single(1.0) - u0)); end
\begin{array}{l}
\\
\left(\left(-\alpha\right) \cdot \alpha\right) \cdot \log \left(1 - u0\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 5 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (alpha u0) :precision binary32 (* (* (- alpha) alpha) (log (- 1.0 u0))))
float code(float alpha, float u0) {
return (-alpha * alpha) * logf((1.0f - u0));
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (-alpha * alpha) * log((1.0e0 - u0))
end function
function code(alpha, u0) return Float32(Float32(Float32(-alpha) * alpha) * log(Float32(Float32(1.0) - u0))) end
function tmp = code(alpha, u0) tmp = (-alpha * alpha) * log((single(1.0) - u0)); end
\begin{array}{l}
\\
\left(\left(-\alpha\right) \cdot \alpha\right) \cdot \log \left(1 - u0\right)
\end{array}
(FPCore (alpha u0) :precision binary32 (* (* u0 alpha) alpha))
float code(float alpha, float u0) {
return (u0 * alpha) * alpha;
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (u0 * alpha) * alpha
end function
function code(alpha, u0) return Float32(Float32(u0 * alpha) * alpha) end
function tmp = code(alpha, u0) tmp = (u0 * alpha) * alpha; end
\begin{array}{l}
\\
\left(u0 \cdot \alpha\right) \cdot \alpha
\end{array}
Initial program 54.3%
Taylor expanded in u0 around 0
lower-*.f32N/A
unpow2N/A
lower-*.f3275.4
Applied rewrites75.4%
Applied rewrites75.4%
(FPCore (alpha u0)
:precision binary32
(if (<= u0 0.003000000026077032)
(/
(*
(* alpha alpha)
(* (- (* (* alpha (fma -0.3333333333333333 u0 -0.5)) u0) alpha) u0))
(- alpha))
(* (/ alpha (/ -1.0 alpha)) (log (- 1.0 u0)))))
float code(float alpha, float u0) {
float tmp;
if (u0 <= 0.003000000026077032f) {
tmp = ((alpha * alpha) * ((((alpha * fmaf(-0.3333333333333333f, u0, -0.5f)) * u0) - alpha) * u0)) / -alpha;
} else {
tmp = (alpha / (-1.0f / alpha)) * logf((1.0f - u0));
}
return tmp;
}
function code(alpha, u0) tmp = Float32(0.0) if (u0 <= Float32(0.003000000026077032)) tmp = Float32(Float32(Float32(alpha * alpha) * Float32(Float32(Float32(Float32(alpha * fma(Float32(-0.3333333333333333), u0, Float32(-0.5))) * u0) - alpha) * u0)) / Float32(-alpha)); else tmp = Float32(Float32(alpha / Float32(Float32(-1.0) / alpha)) * log(Float32(Float32(1.0) - u0))); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;u0 \leq 0.003000000026077032:\\
\;\;\;\;\frac{\left(\alpha \cdot \alpha\right) \cdot \left(\left(\left(\alpha \cdot \mathsf{fma}\left(-0.3333333333333333, u0, -0.5\right)\right) \cdot u0 - \alpha\right) \cdot u0\right)}{-\alpha}\\
\mathbf{else}:\\
\;\;\;\;\frac{\alpha}{\frac{-1}{\alpha}} \cdot \log \left(1 - u0\right)\\
\end{array}
\end{array}
if u0 < 0.00300000003Initial program 42.2%
lift-neg.f32N/A
neg-sub0N/A
flip--N/A
metadata-evalN/A
neg-sub0N/A
distribute-lft-neg-outN/A
lift-neg.f32N/A
lift-*.f32N/A
div-invN/A
lower-*.f32N/A
+-lft-identityN/A
lower-/.f3242.2
Applied rewrites42.2%
Taylor expanded in u0 around 0
mul-1-negN/A
lower-neg.f3285.7
Applied rewrites85.7%
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
lift-*.f32N/A
lift-/.f32N/A
un-div-invN/A
associate-*l/N/A
lower-/.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f3285.7
Applied rewrites85.7%
Taylor expanded in u0 around 0
*-commutativeN/A
lower-*.f32N/A
Applied rewrites97.2%
if 0.00300000003 < u0 Initial program 94.8%
lift-*.f32N/A
*-commutativeN/A
lift-neg.f32N/A
neg-sub0N/A
flip3--N/A
clear-numN/A
un-div-invN/A
lower-/.f32N/A
metadata-evalN/A
+-lft-identityN/A
mul0-lftN/A
+-rgt-identityN/A
clear-numN/A
+-rgt-identityN/A
mul0-lftN/A
+-lft-identityN/A
metadata-evalN/A
flip3--N/A
neg-sub0N/A
lift-neg.f32N/A
lower-/.f3294.9
Applied rewrites94.9%
Final simplification72.8%
(FPCore (alpha u0)
:precision binary32
(if (<= (- 1.0 u0) 0.996999979019165)
(* (* (- alpha) alpha) (log (- 1.0 u0)))
(/
(*
(* alpha alpha)
(* (- (* (* alpha (fma -0.3333333333333333 u0 -0.5)) u0) alpha) u0))
(- alpha))))
float code(float alpha, float u0) {
float tmp;
if ((1.0f - u0) <= 0.996999979019165f) {
tmp = (-alpha * alpha) * logf((1.0f - u0));
} else {
tmp = ((alpha * alpha) * ((((alpha * fmaf(-0.3333333333333333f, u0, -0.5f)) * u0) - alpha) * u0)) / -alpha;
}
return tmp;
}
function code(alpha, u0) tmp = Float32(0.0) if (Float32(Float32(1.0) - u0) <= Float32(0.996999979019165)) tmp = Float32(Float32(Float32(-alpha) * alpha) * log(Float32(Float32(1.0) - u0))); else tmp = Float32(Float32(Float32(alpha * alpha) * Float32(Float32(Float32(Float32(alpha * fma(Float32(-0.3333333333333333), u0, Float32(-0.5))) * u0) - alpha) * u0)) / Float32(-alpha)); end return tmp end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - u0 \leq 0.996999979019165:\\
\;\;\;\;\left(\left(-\alpha\right) \cdot \alpha\right) \cdot \log \left(1 - u0\right)\\
\mathbf{else}:\\
\;\;\;\;\frac{\left(\alpha \cdot \alpha\right) \cdot \left(\left(\left(\alpha \cdot \mathsf{fma}\left(-0.3333333333333333, u0, -0.5\right)\right) \cdot u0 - \alpha\right) \cdot u0\right)}{-\alpha}\\
\end{array}
\end{array}
if (-.f32 #s(literal 1 binary32) u0) < 0.996999979Initial program 94.8%
if 0.996999979 < (-.f32 #s(literal 1 binary32) u0) Initial program 42.2%
lift-neg.f32N/A
neg-sub0N/A
flip--N/A
metadata-evalN/A
neg-sub0N/A
distribute-lft-neg-outN/A
lift-neg.f32N/A
lift-*.f32N/A
div-invN/A
lower-*.f32N/A
+-lft-identityN/A
lower-/.f3242.2
Applied rewrites42.2%
Taylor expanded in u0 around 0
mul-1-negN/A
lower-neg.f3285.7
Applied rewrites85.7%
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
lift-*.f32N/A
lift-/.f32N/A
un-div-invN/A
associate-*l/N/A
lower-/.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f3285.7
Applied rewrites85.7%
Taylor expanded in u0 around 0
*-commutativeN/A
lower-*.f32N/A
Applied rewrites97.4%
Final simplification71.5%
(FPCore (alpha u0) :precision binary32 (/ (* (* alpha alpha) (* (- (* (* alpha (fma -0.3333333333333333 u0 -0.5)) u0) alpha) u0)) (- alpha)))
float code(float alpha, float u0) {
return ((alpha * alpha) * ((((alpha * fmaf(-0.3333333333333333f, u0, -0.5f)) * u0) - alpha) * u0)) / -alpha;
}
function code(alpha, u0) return Float32(Float32(Float32(alpha * alpha) * Float32(Float32(Float32(Float32(alpha * fma(Float32(-0.3333333333333333), u0, Float32(-0.5))) * u0) - alpha) * u0)) / Float32(-alpha)) end
\begin{array}{l}
\\
\frac{\left(\alpha \cdot \alpha\right) \cdot \left(\left(\left(\alpha \cdot \mathsf{fma}\left(-0.3333333333333333, u0, -0.5\right)\right) \cdot u0 - \alpha\right) \cdot u0\right)}{-\alpha}
\end{array}
Initial program 54.3%
lift-neg.f32N/A
neg-sub0N/A
flip--N/A
metadata-evalN/A
neg-sub0N/A
distribute-lft-neg-outN/A
lift-neg.f32N/A
lift-*.f32N/A
div-invN/A
lower-*.f32N/A
+-lft-identityN/A
lower-/.f3254.3
Applied rewrites54.3%
Taylor expanded in u0 around 0
mul-1-negN/A
lower-neg.f3275.3
Applied rewrites75.3%
lift-*.f32N/A
lift-*.f32N/A
associate-*l*N/A
lift-*.f32N/A
lift-/.f32N/A
un-div-invN/A
associate-*l/N/A
lower-/.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-*.f3275.3
Applied rewrites75.3%
Taylor expanded in u0 around 0
*-commutativeN/A
lower-*.f32N/A
Applied rewrites87.3%
Final simplification87.8%
(FPCore (alpha u0) :precision binary32 (* (* alpha alpha) u0))
float code(float alpha, float u0) {
return (alpha * alpha) * u0;
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (alpha * alpha) * u0
end function
function code(alpha, u0) return Float32(Float32(alpha * alpha) * u0) end
function tmp = code(alpha, u0) tmp = (alpha * alpha) * u0; end
\begin{array}{l}
\\
\left(\alpha \cdot \alpha\right) \cdot u0
\end{array}
Initial program 54.3%
Taylor expanded in u0 around 0
lower-*.f32N/A
unpow2N/A
lower-*.f3275.4
Applied rewrites75.4%
herbie shell --seed 2024315
(FPCore (alpha u0)
:name "Beckmann Distribution sample, tan2theta, alphax == alphay"
:precision binary32
:pre (and (and (<= 0.0001 alpha) (<= alpha 1.0)) (and (<= 2.328306437e-10 u0) (<= u0 1.0)))
(* (* (- alpha) alpha) (log (- 1.0 u0))))