
(FPCore (alpha u0) :precision binary32 (* (* (- alpha) alpha) (log (- 1.0 u0))))
float code(float alpha, float u0) {
return (-alpha * alpha) * logf((1.0f - u0));
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (-alpha * alpha) * log((1.0e0 - u0))
end function
function code(alpha, u0) return Float32(Float32(Float32(-alpha) * alpha) * log(Float32(Float32(1.0) - u0))) end
function tmp = code(alpha, u0) tmp = (-alpha * alpha) * log((single(1.0) - u0)); end
\begin{array}{l}
\\
\left(\left(-\alpha\right) \cdot \alpha\right) \cdot \log \left(1 - u0\right)
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 4 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (alpha u0) :precision binary32 (* (* (- alpha) alpha) (log (- 1.0 u0))))
float code(float alpha, float u0) {
return (-alpha * alpha) * logf((1.0f - u0));
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (-alpha * alpha) * log((1.0e0 - u0))
end function
function code(alpha, u0) return Float32(Float32(Float32(-alpha) * alpha) * log(Float32(Float32(1.0) - u0))) end
function tmp = code(alpha, u0) tmp = (-alpha * alpha) * log((single(1.0) - u0)); end
\begin{array}{l}
\\
\left(\left(-\alpha\right) \cdot \alpha\right) \cdot \log \left(1 - u0\right)
\end{array}
(FPCore (alpha u0) :precision binary32 (if (<= (- 1.0 u0) 0.9959999918937683) (* (* (log (- 1.0 u0)) (- alpha)) alpha) (* (* alpha alpha) (+ (* (* 0.5 u0) u0) u0))))
float code(float alpha, float u0) {
float tmp;
if ((1.0f - u0) <= 0.9959999918937683f) {
tmp = (logf((1.0f - u0)) * -alpha) * alpha;
} else {
tmp = (alpha * alpha) * (((0.5f * u0) * u0) + u0);
}
return tmp;
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
real(4) :: tmp
if ((1.0e0 - u0) <= 0.9959999918937683e0) then
tmp = (log((1.0e0 - u0)) * -alpha) * alpha
else
tmp = (alpha * alpha) * (((0.5e0 * u0) * u0) + u0)
end if
code = tmp
end function
function code(alpha, u0) tmp = Float32(0.0) if (Float32(Float32(1.0) - u0) <= Float32(0.9959999918937683)) tmp = Float32(Float32(log(Float32(Float32(1.0) - u0)) * Float32(-alpha)) * alpha); else tmp = Float32(Float32(alpha * alpha) * Float32(Float32(Float32(Float32(0.5) * u0) * u0) + u0)); end return tmp end
function tmp_2 = code(alpha, u0) tmp = single(0.0); if ((single(1.0) - u0) <= single(0.9959999918937683)) tmp = (log((single(1.0) - u0)) * -alpha) * alpha; else tmp = (alpha * alpha) * (((single(0.5) * u0) * u0) + u0); end tmp_2 = tmp; end
\begin{array}{l}
\\
\begin{array}{l}
\mathbf{if}\;1 - u0 \leq 0.9959999918937683:\\
\;\;\;\;\left(\log \left(1 - u0\right) \cdot \left(-\alpha\right)\right) \cdot \alpha\\
\mathbf{else}:\\
\;\;\;\;\left(\alpha \cdot \alpha\right) \cdot \left(\left(0.5 \cdot u0\right) \cdot u0 + u0\right)\\
\end{array}
\end{array}
if (-.f32 #s(literal 1 binary32) u0) < 0.995999992Initial program 93.5%
Taylor expanded in alpha around 0
mul-1-negN/A
unpow2N/A
associate-*l*N/A
distribute-rgt-neg-inN/A
*-commutativeN/A
lower-*.f32N/A
distribute-lft-neg-inN/A
mul-1-negN/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f32N/A
sub-negN/A
lower-log1p.f32N/A
lower-neg.f3242.1
Applied rewrites42.1%
Applied rewrites93.6%
if 0.995999992 < (-.f32 #s(literal 1 binary32) u0) Initial program 45.2%
+-lft-identityN/A
flip-+N/A
neg-sub0N/A
lift-*.f32N/A
lift-neg.f32N/A
distribute-lft-neg-outN/A
remove-double-negN/A
lower-/.f32N/A
metadata-evalN/A
lower--.f32N/A
lower-*.f32N/A
lower-*.f3245.2
Applied rewrites45.2%
Taylor expanded in u0 around 0
distribute-lft-inN/A
associate-*r*N/A
*-commutativeN/A
distribute-lft1-inN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-fma.f32N/A
unpow2N/A
lower-*.f3284.7
Applied rewrites84.2%
Applied rewrites98.2%
Final simplification96.9%
(FPCore (alpha u0) :precision binary32 (* (* alpha alpha) (+ (* (* 0.5 u0) u0) u0)))
float code(float alpha, float u0) {
return (alpha * alpha) * (((0.5f * u0) * u0) + u0);
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (alpha * alpha) * (((0.5e0 * u0) * u0) + u0)
end function
function code(alpha, u0) return Float32(Float32(alpha * alpha) * Float32(Float32(Float32(Float32(0.5) * u0) * u0) + u0)) end
function tmp = code(alpha, u0) tmp = (alpha * alpha) * (((single(0.5) * u0) * u0) + u0); end
\begin{array}{l}
\\
\left(\alpha \cdot \alpha\right) \cdot \left(\left(0.5 \cdot u0\right) \cdot u0 + u0\right)
\end{array}
Initial program 58.8%
+-lft-identityN/A
flip-+N/A
neg-sub0N/A
lift-*.f32N/A
lift-neg.f32N/A
distribute-lft-neg-outN/A
remove-double-negN/A
lower-/.f32N/A
metadata-evalN/A
lower--.f32N/A
lower-*.f32N/A
lower-*.f3258.8
Applied rewrites58.8%
Taylor expanded in u0 around 0
distribute-lft-inN/A
associate-*r*N/A
*-commutativeN/A
distribute-lft1-inN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-fma.f32N/A
unpow2N/A
lower-*.f3272.7
Applied rewrites72.4%
Applied rewrites86.6%
Final simplification86.6%
(FPCore (alpha u0) :precision binary32 (* (* (+ (* 0.5 u0) 1.0) u0) (* alpha alpha)))
float code(float alpha, float u0) {
return (((0.5f * u0) + 1.0f) * u0) * (alpha * alpha);
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (((0.5e0 * u0) + 1.0e0) * u0) * (alpha * alpha)
end function
function code(alpha, u0) return Float32(Float32(Float32(Float32(Float32(0.5) * u0) + Float32(1.0)) * u0) * Float32(alpha * alpha)) end
function tmp = code(alpha, u0) tmp = (((single(0.5) * u0) + single(1.0)) * u0) * (alpha * alpha); end
\begin{array}{l}
\\
\left(\left(0.5 \cdot u0 + 1\right) \cdot u0\right) \cdot \left(\alpha \cdot \alpha\right)
\end{array}
Initial program 58.8%
+-lft-identityN/A
flip-+N/A
neg-sub0N/A
lift-*.f32N/A
lift-neg.f32N/A
distribute-lft-neg-outN/A
remove-double-negN/A
lower-/.f32N/A
metadata-evalN/A
lower--.f32N/A
lower-*.f32N/A
lower-*.f3258.8
Applied rewrites58.8%
Taylor expanded in u0 around 0
distribute-lft-inN/A
associate-*r*N/A
*-commutativeN/A
distribute-lft1-inN/A
*-commutativeN/A
associate-*r*N/A
lower-*.f32N/A
lower-*.f32N/A
*-commutativeN/A
lower-fma.f32N/A
unpow2N/A
lower-*.f3272.7
Applied rewrites72.4%
Applied rewrites86.4%
(FPCore (alpha u0) :precision binary32 (* (* alpha alpha) u0))
float code(float alpha, float u0) {
return (alpha * alpha) * u0;
}
real(4) function code(alpha, u0)
real(4), intent (in) :: alpha
real(4), intent (in) :: u0
code = (alpha * alpha) * u0
end function
function code(alpha, u0) return Float32(Float32(alpha * alpha) * u0) end
function tmp = code(alpha, u0) tmp = (alpha * alpha) * u0; end
\begin{array}{l}
\\
\left(\alpha \cdot \alpha\right) \cdot u0
\end{array}
Initial program 58.8%
Taylor expanded in u0 around 0
*-commutativeN/A
lower-*.f32N/A
unpow2N/A
lower-*.f3272.7
Applied rewrites72.7%
Final simplification72.7%
herbie shell --seed 2024277
(FPCore (alpha u0)
:name "Beckmann Distribution sample, tan2theta, alphax == alphay"
:precision binary32
:pre (and (and (<= 0.0001 alpha) (<= alpha 1.0)) (and (<= 2.328306437e-10 u0) (<= u0 1.0)))
(* (* (- alpha) alpha) (log (- 1.0 u0))))