Beckmann Distribution sample, tan2theta, alphax != alphay, u1 <= 0.5

Percentage Accurate: 60.8% → 98.4%
Time: 15.8s
Alternatives: 21
Speedup: 3.5×

Specification

?
\[\left(\left(\left(\left(0.0001 \leq alphax \land alphax \leq 1\right) \land \left(0.0001 \leq alphay \land alphay \leq 1\right)\right) \land \left(2.328306437 \cdot 10^{-10} \leq u0 \land u0 \leq 1\right)\right) \land \left(0 \leq cos2phi \land cos2phi \leq 1\right)\right) \land 0 \leq sin2phi\]
\[\begin{array}{l} \\ \frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \end{array} \]
(FPCore (alphax alphay u0 cos2phi sin2phi)
 :precision binary32
 (/
  (- (log (- 1.0 u0)))
  (+ (/ cos2phi (* alphax alphax)) (/ sin2phi (* alphay alphay)))))
float code(float alphax, float alphay, float u0, float cos2phi, float sin2phi) {
	return -logf((1.0f - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)));
}
real(4) function code(alphax, alphay, u0, cos2phi, sin2phi)
    real(4), intent (in) :: alphax
    real(4), intent (in) :: alphay
    real(4), intent (in) :: u0
    real(4), intent (in) :: cos2phi
    real(4), intent (in) :: sin2phi
    code = -log((1.0e0 - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)))
end function
function code(alphax, alphay, u0, cos2phi, sin2phi)
	return Float32(Float32(-log(Float32(Float32(1.0) - u0))) / Float32(Float32(cos2phi / Float32(alphax * alphax)) + Float32(sin2phi / Float32(alphay * alphay))))
end
function tmp = code(alphax, alphay, u0, cos2phi, sin2phi)
	tmp = -log((single(1.0) - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)));
end
\begin{array}{l}

\\
\frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}}
\end{array}

Sampling outcomes in binary32 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 21 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 60.8% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \end{array} \]
(FPCore (alphax alphay u0 cos2phi sin2phi)
 :precision binary32
 (/
  (- (log (- 1.0 u0)))
  (+ (/ cos2phi (* alphax alphax)) (/ sin2phi (* alphay alphay)))))
float code(float alphax, float alphay, float u0, float cos2phi, float sin2phi) {
	return -logf((1.0f - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)));
}
real(4) function code(alphax, alphay, u0, cos2phi, sin2phi)
    real(4), intent (in) :: alphax
    real(4), intent (in) :: alphay
    real(4), intent (in) :: u0
    real(4), intent (in) :: cos2phi
    real(4), intent (in) :: sin2phi
    code = -log((1.0e0 - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)))
end function
function code(alphax, alphay, u0, cos2phi, sin2phi)
	return Float32(Float32(-log(Float32(Float32(1.0) - u0))) / Float32(Float32(cos2phi / Float32(alphax * alphax)) + Float32(sin2phi / Float32(alphay * alphay))))
end
function tmp = code(alphax, alphay, u0, cos2phi, sin2phi)
	tmp = -log((single(1.0) - u0)) / ((cos2phi / (alphax * alphax)) + (sin2phi / (alphay * alphay)));
end
\begin{array}{l}

\\
\frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}}
\end{array}

Alternative 1: 98.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \frac{\mathsf{log1p}\left(-u0\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{sin2phi}{alphay \cdot alphay}} \end{array} \]
(FPCore (alphax alphay u0 cos2phi sin2phi)
 :precision binary32
 (/
  (log1p (- u0))
  (- (/ (- cos2phi) (* alphax alphax)) (/ sin2phi (* alphay alphay)))))
float code(float alphax, float alphay, float u0, float cos2phi, float sin2phi) {
	return log1pf(-u0) / ((-cos2phi / (alphax * alphax)) - (sin2phi / (alphay * alphay)));
}
function code(alphax, alphay, u0, cos2phi, sin2phi)
	return Float32(log1p(Float32(-u0)) / Float32(Float32(Float32(-cos2phi) / Float32(alphax * alphax)) - Float32(sin2phi / Float32(alphay * alphay))))
end
\begin{array}{l}

\\
\frac{\mathsf{log1p}\left(-u0\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{sin2phi}{alphay \cdot alphay}}
\end{array}
Derivation
  1. Initial program 61.9%

    \[\frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  2. Add Preprocessing
  3. Step-by-step derivation
    1. sub-negN/A

      \[\leadsto \frac{\mathsf{neg}\left(\log \color{blue}{\left(1 + \left(\mathsf{neg}\left(u0\right)\right)\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    2. lower-log1p.f32N/A

      \[\leadsto \frac{\mathsf{neg}\left(\color{blue}{\mathsf{log1p}\left(\mathsf{neg}\left(u0\right)\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    3. lower-neg.f3298.7

      \[\leadsto \frac{-\mathsf{log1p}\left(\color{blue}{-u0}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  4. Applied egg-rr98.7%

    \[\leadsto \frac{-\color{blue}{\mathsf{log1p}\left(-u0\right)}}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  5. Final simplification98.7%

    \[\leadsto \frac{\mathsf{log1p}\left(-u0\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{sin2phi}{alphay \cdot alphay}} \]
  6. Add Preprocessing

Alternative 2: 93.0% accurate, 1.9× speedup?

\[\begin{array}{l} \\ \frac{u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{\frac{sin2phi}{alphay}}{alphay}} \end{array} \]
(FPCore (alphax alphay u0 cos2phi sin2phi)
 :precision binary32
 (/
  (* u0 (fma u0 (fma u0 (fma u0 -0.25 -0.3333333333333333) -0.5) -1.0))
  (- (/ (- cos2phi) (* alphax alphax)) (/ (/ sin2phi alphay) alphay))))
float code(float alphax, float alphay, float u0, float cos2phi, float sin2phi) {
	return (u0 * fmaf(u0, fmaf(u0, fmaf(u0, -0.25f, -0.3333333333333333f), -0.5f), -1.0f)) / ((-cos2phi / (alphax * alphax)) - ((sin2phi / alphay) / alphay));
}
function code(alphax, alphay, u0, cos2phi, sin2phi)
	return Float32(Float32(u0 * fma(u0, fma(u0, fma(u0, Float32(-0.25), Float32(-0.3333333333333333)), Float32(-0.5)), Float32(-1.0))) / Float32(Float32(Float32(-cos2phi) / Float32(alphax * alphax)) - Float32(Float32(sin2phi / alphay) / alphay)))
end
\begin{array}{l}

\\
\frac{u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{\frac{sin2phi}{alphay}}{alphay}}
\end{array}
Derivation
  1. Initial program 60.8%

    \[\frac{-\log \left(1 - u0\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  2. Add Preprocessing
  3. Taylor expanded in u0 around 0

    \[\leadsto \frac{\mathsf{neg}\left(\color{blue}{u0 \cdot \left(u0 \cdot \left(u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) - \frac{1}{2}\right) - 1\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  4. Step-by-step derivation
    1. lower-*.f32N/A

      \[\leadsto \frac{\mathsf{neg}\left(\color{blue}{u0 \cdot \left(u0 \cdot \left(u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) - \frac{1}{2}\right) - 1\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    2. sub-negN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \color{blue}{\left(u0 \cdot \left(u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) - \frac{1}{2}\right) + \left(\mathsf{neg}\left(1\right)\right)\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    3. metadata-evalN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \left(u0 \cdot \left(u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) - \frac{1}{2}\right) + \color{blue}{-1}\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    4. lower-fma.f32N/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \color{blue}{\mathsf{fma}\left(u0, u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) - \frac{1}{2}, -1\right)}\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    5. sub-negN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \color{blue}{u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) + \left(\mathsf{neg}\left(\frac{1}{2}\right)\right)}, -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    6. metadata-evalN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, u0 \cdot \left(\frac{-1}{4} \cdot u0 - \frac{1}{3}\right) + \color{blue}{\frac{-1}{2}}, -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    7. lower-fma.f32N/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \color{blue}{\mathsf{fma}\left(u0, \frac{-1}{4} \cdot u0 - \frac{1}{3}, \frac{-1}{2}\right)}, -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    8. sub-negN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \color{blue}{\frac{-1}{4} \cdot u0 + \left(\mathsf{neg}\left(\frac{1}{3}\right)\right)}, \frac{-1}{2}\right), -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    9. *-commutativeN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \color{blue}{u0 \cdot \frac{-1}{4}} + \left(\mathsf{neg}\left(\frac{1}{3}\right)\right), \frac{-1}{2}\right), -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    10. metadata-evalN/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, u0 \cdot \frac{-1}{4} + \color{blue}{\frac{-1}{3}}, \frac{-1}{2}\right), -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
    11. lower-fma.f3293.0

      \[\leadsto \frac{-u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \color{blue}{\mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right)}, -0.5\right), -1\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  5. Simplified93.0%

    \[\leadsto \frac{-\color{blue}{u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}}{\frac{cos2phi}{alphax \cdot alphax} + \frac{sin2phi}{alphay \cdot alphay}} \]
  6. Step-by-step derivation
    1. associate-/r*N/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \frac{-1}{4}, \frac{-1}{3}\right), \frac{-1}{2}\right), -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \color{blue}{\frac{\frac{sin2phi}{alphay}}{alphay}}} \]
    2. lower-/.f32N/A

      \[\leadsto \frac{\mathsf{neg}\left(u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \frac{-1}{4}, \frac{-1}{3}\right), \frac{-1}{2}\right), -1\right)\right)}{\frac{cos2phi}{alphax \cdot alphax} + \color{blue}{\frac{\frac{sin2phi}{alphay}}{alphay}}} \]
    3. lower-/.f3293.0

      \[\leadsto \frac{-u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}{\frac{cos2phi}{alphax \cdot alphax} + \frac{\color{blue}{\frac{sin2phi}{alphay}}}{alphay}} \]
  7. Applied egg-rr93.0%

    \[\leadsto \frac{-u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}{\frac{cos2phi}{alphax \cdot alphax} + \color{blue}{\frac{\frac{sin2phi}{alphay}}{alphay}}} \]
  8. Final simplification93.0%

    \[\leadsto \frac{u0 \cdot \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, \mathsf{fma}\left(u0, -0.25, -0.3333333333333333\right), -0.5\right), -1\right)}{\frac{-cos2phi}{alphax \cdot alphax} - \frac{\frac{sin2phi}{alphay}}{alphay}} \]
  9. Add Preprocessing

Reproduce

?
herbie shell --seed 2024218 
(FPCore (alphax alphay u0 cos2phi sin2phi)
  :name "Beckmann Distribution sample, tan2theta, alphax != alphay, u1 <= 0.5"
  :precision binary32
  :pre (and (and (and (and (and (<= 0.0001 alphax) (<= alphax 1.0)) (and (<= 0.0001 alphay) (<= alphay 1.0))) (and (<= 2.328306437e-10 u0) (<= u0 1.0))) (and (<= 0.0 cos2phi) (<= cos2phi 1.0))) (<= 0.0 sin2phi))
  (/ (- (log (- 1.0 u0))) (+ (/ cos2phi (* alphax alphax)) (/ sin2phi (* alphay alphay)))))