Average Error: 13.8 → 0.7
Time: 14.8s
Precision: binary64
Cost: 40260
\[wj - \frac{wj \cdot e^{wj} - x}{e^{wj} + wj \cdot e^{wj}} \]
\[\begin{array}{l} t_0 := wj \cdot e^{wj}\\ t_1 := x \cdot 4 + x \cdot -1.5\\ \mathbf{if}\;wj + \frac{x - t_0}{e^{wj} + t_0} \leq 2 \cdot 10^{-19}:\\ \;\;\;\;{wj}^{3} \cdot \left(x \cdot -0.6666666666666666 + \left(x \cdot 3 + \left(-1 - 2 \cdot t_1\right)\right)\right) + \left(\left(1 + t_1\right) \cdot {wj}^{2} + \left(x + -2 \cdot \left(wj \cdot x\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(wj - \frac{x}{e^{wj}}, \left(wj + -1\right) \cdot \frac{-1}{\mathsf{fma}\left(wj, wj, -1\right)}, wj\right)\\ \end{array} \]
(FPCore (wj x)
 :precision binary64
 (- wj (/ (- (* wj (exp wj)) x) (+ (exp wj) (* wj (exp wj))))))
(FPCore (wj x)
 :precision binary64
 (let* ((t_0 (* wj (exp wj))) (t_1 (+ (* x 4.0) (* x -1.5))))
   (if (<= (+ wj (/ (- x t_0) (+ (exp wj) t_0))) 2e-19)
     (+
      (*
       (pow wj 3.0)
       (+ (* x -0.6666666666666666) (+ (* x 3.0) (- -1.0 (* 2.0 t_1)))))
      (+ (* (+ 1.0 t_1) (pow wj 2.0)) (+ x (* -2.0 (* wj x)))))
     (fma
      (- wj (/ x (exp wj)))
      (* (+ wj -1.0) (/ -1.0 (fma wj wj -1.0)))
      wj))))
double code(double wj, double x) {
	return wj - (((wj * exp(wj)) - x) / (exp(wj) + (wj * exp(wj))));
}
double code(double wj, double x) {
	double t_0 = wj * exp(wj);
	double t_1 = (x * 4.0) + (x * -1.5);
	double tmp;
	if ((wj + ((x - t_0) / (exp(wj) + t_0))) <= 2e-19) {
		tmp = (pow(wj, 3.0) * ((x * -0.6666666666666666) + ((x * 3.0) + (-1.0 - (2.0 * t_1))))) + (((1.0 + t_1) * pow(wj, 2.0)) + (x + (-2.0 * (wj * x))));
	} else {
		tmp = fma((wj - (x / exp(wj))), ((wj + -1.0) * (-1.0 / fma(wj, wj, -1.0))), wj);
	}
	return tmp;
}
function code(wj, x)
	return Float64(wj - Float64(Float64(Float64(wj * exp(wj)) - x) / Float64(exp(wj) + Float64(wj * exp(wj)))))
end
function code(wj, x)
	t_0 = Float64(wj * exp(wj))
	t_1 = Float64(Float64(x * 4.0) + Float64(x * -1.5))
	tmp = 0.0
	if (Float64(wj + Float64(Float64(x - t_0) / Float64(exp(wj) + t_0))) <= 2e-19)
		tmp = Float64(Float64((wj ^ 3.0) * Float64(Float64(x * -0.6666666666666666) + Float64(Float64(x * 3.0) + Float64(-1.0 - Float64(2.0 * t_1))))) + Float64(Float64(Float64(1.0 + t_1) * (wj ^ 2.0)) + Float64(x + Float64(-2.0 * Float64(wj * x)))));
	else
		tmp = fma(Float64(wj - Float64(x / exp(wj))), Float64(Float64(wj + -1.0) * Float64(-1.0 / fma(wj, wj, -1.0))), wj);
	end
	return tmp
end
code[wj_, x_] := N[(wj - N[(N[(N[(wj * N[Exp[wj], $MachinePrecision]), $MachinePrecision] - x), $MachinePrecision] / N[(N[Exp[wj], $MachinePrecision] + N[(wj * N[Exp[wj], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
code[wj_, x_] := Block[{t$95$0 = N[(wj * N[Exp[wj], $MachinePrecision]), $MachinePrecision]}, Block[{t$95$1 = N[(N[(x * 4.0), $MachinePrecision] + N[(x * -1.5), $MachinePrecision]), $MachinePrecision]}, If[LessEqual[N[(wj + N[(N[(x - t$95$0), $MachinePrecision] / N[(N[Exp[wj], $MachinePrecision] + t$95$0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], 2e-19], N[(N[(N[Power[wj, 3.0], $MachinePrecision] * N[(N[(x * -0.6666666666666666), $MachinePrecision] + N[(N[(x * 3.0), $MachinePrecision] + N[(-1.0 - N[(2.0 * t$95$1), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + N[(N[(N[(1.0 + t$95$1), $MachinePrecision] * N[Power[wj, 2.0], $MachinePrecision]), $MachinePrecision] + N[(x + N[(-2.0 * N[(wj * x), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision], N[(N[(wj - N[(x / N[Exp[wj], $MachinePrecision]), $MachinePrecision]), $MachinePrecision] * N[(N[(wj + -1.0), $MachinePrecision] * N[(-1.0 / N[(wj * wj + -1.0), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] + wj), $MachinePrecision]]]]
wj - \frac{wj \cdot e^{wj} - x}{e^{wj} + wj \cdot e^{wj}}
\begin{array}{l}
t_0 := wj \cdot e^{wj}\\
t_1 := x \cdot 4 + x \cdot -1.5\\
\mathbf{if}\;wj + \frac{x - t_0}{e^{wj} + t_0} \leq 2 \cdot 10^{-19}:\\
\;\;\;\;{wj}^{3} \cdot \left(x \cdot -0.6666666666666666 + \left(x \cdot 3 + \left(-1 - 2 \cdot t_1\right)\right)\right) + \left(\left(1 + t_1\right) \cdot {wj}^{2} + \left(x + -2 \cdot \left(wj \cdot x\right)\right)\right)\\

\mathbf{else}:\\
\;\;\;\;\mathsf{fma}\left(wj - \frac{x}{e^{wj}}, \left(wj + -1\right) \cdot \frac{-1}{\mathsf{fma}\left(wj, wj, -1\right)}, wj\right)\\


\end{array}

Error

Target

Original13.8
Target13.0
Herbie0.7
\[wj - \left(\frac{wj}{wj + 1} - \frac{x}{e^{wj} + wj \cdot e^{wj}}\right) \]

Derivation

  1. Split input into 2 regimes
  2. if (-.f64 wj (/.f64 (-.f64 (*.f64 wj (exp.f64 wj)) x) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj))))) < 2e-19

    1. Initial program 18.0

      \[wj - \frac{wj \cdot e^{wj} - x}{e^{wj} + wj \cdot e^{wj}} \]
    2. Simplified18.0

      \[\leadsto \color{blue}{wj - \frac{wj - \frac{x}{e^{wj}}}{wj + 1}} \]
      Proof
      (-.f64 wj (/.f64 (-.f64 wj (/.f64 x (exp.f64 wj))) (+.f64 wj 1))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (Rewrite=> div-sub_binary64 (-.f64 (/.f64 wj (+.f64 wj 1)) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1))))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (Rewrite<= *-rgt-identity_binary64 (*.f64 (/.f64 wj (+.f64 wj 1)) 1)) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (*.f64 (/.f64 wj (+.f64 wj 1)) (Rewrite<= *-inverses_binary64 (/.f64 (exp.f64 wj) (exp.f64 wj)))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 2 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (Rewrite<= times-frac_binary64 (/.f64 (*.f64 wj (exp.f64 wj)) (*.f64 (+.f64 wj 1) (exp.f64 wj)))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 2 points increase in error, 1 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (Rewrite<= distribute-rgt1-in_binary64 (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj))))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))) (Rewrite=> associate-/l/_binary64 (/.f64 x (*.f64 (+.f64 wj 1) (exp.f64 wj)))))): 1 points increase in error, 1 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))) (/.f64 x (Rewrite<= distribute-rgt1-in_binary64 (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj))))))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (Rewrite<= div-sub_binary64 (/.f64 (-.f64 (*.f64 wj (exp.f64 wj)) x) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))))): 0 points increase in error, 0 points decrease in error
    3. Taylor expanded in wj around 0 0.6

      \[\leadsto \color{blue}{-1 \cdot \left(\left(0.6666666666666666 \cdot x + \left(-3 \cdot x + \left(1 + -2 \cdot \left(-4 \cdot x + 1.5 \cdot x\right)\right)\right)\right) \cdot {wj}^{3}\right) + \left(\left(1 - \left(-4 \cdot x + 1.5 \cdot x\right)\right) \cdot {wj}^{2} + \left(-2 \cdot \left(wj \cdot x\right) + x\right)\right)} \]

    if 2e-19 < (-.f64 wj (/.f64 (-.f64 (*.f64 wj (exp.f64 wj)) x) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))))

    1. Initial program 3.5

      \[wj - \frac{wj \cdot e^{wj} - x}{e^{wj} + wj \cdot e^{wj}} \]
    2. Simplified0.7

      \[\leadsto \color{blue}{wj - \frac{wj - \frac{x}{e^{wj}}}{wj + 1}} \]
      Proof
      (-.f64 wj (/.f64 (-.f64 wj (/.f64 x (exp.f64 wj))) (+.f64 wj 1))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (Rewrite=> div-sub_binary64 (-.f64 (/.f64 wj (+.f64 wj 1)) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1))))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (Rewrite<= *-rgt-identity_binary64 (*.f64 (/.f64 wj (+.f64 wj 1)) 1)) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (*.f64 (/.f64 wj (+.f64 wj 1)) (Rewrite<= *-inverses_binary64 (/.f64 (exp.f64 wj) (exp.f64 wj)))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 2 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (Rewrite<= times-frac_binary64 (/.f64 (*.f64 wj (exp.f64 wj)) (*.f64 (+.f64 wj 1) (exp.f64 wj)))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 2 points increase in error, 1 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (Rewrite<= distribute-rgt1-in_binary64 (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj))))) (/.f64 (/.f64 x (exp.f64 wj)) (+.f64 wj 1)))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))) (Rewrite=> associate-/l/_binary64 (/.f64 x (*.f64 (+.f64 wj 1) (exp.f64 wj)))))): 1 points increase in error, 1 points decrease in error
      (-.f64 wj (-.f64 (/.f64 (*.f64 wj (exp.f64 wj)) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))) (/.f64 x (Rewrite<= distribute-rgt1-in_binary64 (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj))))))): 0 points increase in error, 0 points decrease in error
      (-.f64 wj (Rewrite<= div-sub_binary64 (/.f64 (-.f64 (*.f64 wj (exp.f64 wj)) x) (+.f64 (exp.f64 wj) (*.f64 wj (exp.f64 wj)))))): 0 points increase in error, 0 points decrease in error
    3. Applied egg-rr0.8

      \[\leadsto \color{blue}{\mathsf{fma}\left(wj - \frac{x}{e^{wj}}, -\frac{1}{wj + 1}, wj\right)} \]
    4. Applied egg-rr0.8

      \[\leadsto \mathsf{fma}\left(wj - \frac{x}{e^{wj}}, -\color{blue}{\frac{1}{\mathsf{fma}\left(wj, wj, -1\right)} \cdot \left(wj + -1\right)}, wj\right) \]
  3. Recombined 2 regimes into one program.
  4. Final simplification0.7

    \[\leadsto \begin{array}{l} \mathbf{if}\;wj + \frac{x - wj \cdot e^{wj}}{e^{wj} + wj \cdot e^{wj}} \leq 2 \cdot 10^{-19}:\\ \;\;\;\;{wj}^{3} \cdot \left(x \cdot -0.6666666666666666 + \left(x \cdot 3 + \left(-1 - 2 \cdot \left(x \cdot 4 + x \cdot -1.5\right)\right)\right)\right) + \left(\left(1 + \left(x \cdot 4 + x \cdot -1.5\right)\right) \cdot {wj}^{2} + \left(x + -2 \cdot \left(wj \cdot x\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\mathsf{fma}\left(wj - \frac{x}{e^{wj}}, \left(wj + -1\right) \cdot \frac{-1}{\mathsf{fma}\left(wj, wj, -1\right)}, wj\right)\\ \end{array} \]

Alternatives

Alternative 1
Error0.7
Cost35652
\[\begin{array}{l} t_0 := wj \cdot e^{wj}\\ t_1 := x \cdot 4 + x \cdot -1.5\\ \mathbf{if}\;wj + \frac{x - t_0}{e^{wj} + t_0} \leq 2 \cdot 10^{-19}:\\ \;\;\;\;{wj}^{3} \cdot \left(x \cdot -0.6666666666666666 + \left(x \cdot 3 + \left(-1 - 2 \cdot t_1\right)\right)\right) + \left(\left(1 + t_1\right) \cdot {wj}^{2} + \left(x + -2 \cdot \left(wj \cdot x\right)\right)\right)\\ \mathbf{else}:\\ \;\;\;\;\frac{x}{e^{wj} \cdot \left(wj + 1\right)} + \left(wj - \frac{wj}{wj + 1}\right)\\ \end{array} \]
Alternative 2
Error2.2
Cost8576
\[{wj}^{3} \cdot \left(x \cdot -0.6666666666666666 + \left(x \cdot 3 + \left(-1 - 2 \cdot \left(x \cdot 4 + x \cdot -1.5\right)\right)\right)\right) + \left(\left(x + -2 \cdot \left(wj \cdot x\right)\right) + wj \cdot wj\right) \]
Alternative 3
Error2.1
Cost7296
\[\left(\left(x + -2 \cdot \left(wj \cdot x\right)\right) + wj \cdot wj\right) - {wj}^{3} \]
Alternative 4
Error2.4
Cost6848
\[\mathsf{fma}\left(wj, wj + x \cdot -2, x\right) \]
Alternative 5
Error2.4
Cost704
\[\left(x + -2 \cdot \left(wj \cdot x\right)\right) + wj \cdot wj \]
Alternative 6
Error9.6
Cost448
\[\frac{x}{1 + wj \cdot 2} \]
Alternative 7
Error10.0
Cost64
\[x \]

Error

Reproduce

herbie shell --seed 2022308 
(FPCore (wj x)
  :name "Jmat.Real.lambertw, newton loop step"
  :precision binary64

  :herbie-target
  (- wj (- (/ wj (+ wj 1.0)) (/ x (+ (exp wj) (* wj (exp wj))))))

  (- wj (/ (- (* wj (exp wj)) x) (+ (exp wj) (* wj (exp wj))))))