
(FPCore (x y z) :precision binary64 (sqrt (+ (* x x) (+ (* y y) (* z z)))))
double code(double x, double y, double z) {
return sqrt(((x * x) + ((y * y) + (z * z))));
}
module fmin_fmax_functions
implicit none
private
public fmax
public fmin
interface fmax
module procedure fmax88
module procedure fmax44
module procedure fmax84
module procedure fmax48
end interface
interface fmin
module procedure fmin88
module procedure fmin44
module procedure fmin84
module procedure fmin48
end interface
contains
real(8) function fmax88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(4) function fmax44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(8) function fmax84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, max(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmax48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), max(dble(x), y), y /= y), x /= x)
end function
real(8) function fmin88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(4) function fmin44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(8) function fmin84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, min(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmin48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), min(dble(x), y), y /= y), x /= x)
end function
end module
real(8) function code(x, y, z)
use fmin_fmax_functions
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
code = sqrt(((x * x) + ((y * y) + (z * z))))
end function
public static double code(double x, double y, double z) {
return Math.sqrt(((x * x) + ((y * y) + (z * z))));
}
def code(x, y, z): return math.sqrt(((x * x) + ((y * y) + (z * z))))
function code(x, y, z) return sqrt(Float64(Float64(x * x) + Float64(Float64(y * y) + Float64(z * z)))) end
function tmp = code(x, y, z) tmp = sqrt(((x * x) + ((y * y) + (z * z)))); end
code[x_, y_, z_] := N[Sqrt[N[(N[(x * x), $MachinePrecision] + N[(N[(y * y), $MachinePrecision] + N[(z * z), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{x \cdot x + \left(y \cdot y + z \cdot z\right)}
\end{array}
Herbie found 9 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x y z) :precision binary64 (sqrt (+ (* x x) (+ (* y y) (* z z)))))
double code(double x, double y, double z) {
return sqrt(((x * x) + ((y * y) + (z * z))));
}
module fmin_fmax_functions
implicit none
private
public fmax
public fmin
interface fmax
module procedure fmax88
module procedure fmax44
module procedure fmax84
module procedure fmax48
end interface
interface fmin
module procedure fmin88
module procedure fmin44
module procedure fmin84
module procedure fmin48
end interface
contains
real(8) function fmax88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(4) function fmax44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(8) function fmax84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, max(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmax48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), max(dble(x), y), y /= y), x /= x)
end function
real(8) function fmin88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(4) function fmin44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(8) function fmin84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, min(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmin48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), min(dble(x), y), y /= y), x /= x)
end function
end module
real(8) function code(x, y, z)
use fmin_fmax_functions
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
code = sqrt(((x * x) + ((y * y) + (z * z))))
end function
public static double code(double x, double y, double z) {
return Math.sqrt(((x * x) + ((y * y) + (z * z))));
}
def code(x, y, z): return math.sqrt(((x * x) + ((y * y) + (z * z))))
function code(x, y, z) return sqrt(Float64(Float64(x * x) + Float64(Float64(y * y) + Float64(z * z)))) end
function tmp = code(x, y, z) tmp = sqrt(((x * x) + ((y * y) + (z * z)))); end
code[x_, y_, z_] := N[Sqrt[N[(N[(x * x), $MachinePrecision] + N[(N[(y * y), $MachinePrecision] + N[(z * z), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{x \cdot x + \left(y \cdot y + z \cdot z\right)}
\end{array}
x_m = (fabs.f64 x)
y_m = (fabs.f64 y)
z_m = (fabs.f64 z)
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
(FPCore (x_m y_m z_m)
:precision binary64
(if (<= y_m 1.05e+120)
(* z_m (fma (/ 0.5 z_m) (/ (fma y_m y_m (* x_m x_m)) z_m) 1.0))
(*
(sqrt (fma (/ z_m y_m) (/ z_m y_m) (fma x_m (/ x_m (* y_m y_m)) 1.0)))
(fabs y_m))))x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
double tmp;
if (y_m <= 1.05e+120) {
tmp = z_m * fma((0.5 / z_m), (fma(y_m, y_m, (x_m * x_m)) / z_m), 1.0);
} else {
tmp = sqrt(fma((z_m / y_m), (z_m / y_m), fma(x_m, (x_m / (y_m * y_m)), 1.0))) * fabs(y_m);
}
return tmp;
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) tmp = 0.0 if (y_m <= 1.05e+120) tmp = Float64(z_m * fma(Float64(0.5 / z_m), Float64(fma(y_m, y_m, Float64(x_m * x_m)) / z_m), 1.0)); else tmp = Float64(sqrt(fma(Float64(z_m / y_m), Float64(z_m / y_m), fma(x_m, Float64(x_m / Float64(y_m * y_m)), 1.0))) * abs(y_m)); end return tmp end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := If[LessEqual[y$95$m, 1.05e+120], N[(z$95$m * N[(N[(0.5 / z$95$m), $MachinePrecision] * N[(N[(y$95$m * y$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision] / z$95$m), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision], N[(N[Sqrt[N[(N[(z$95$m / y$95$m), $MachinePrecision] * N[(z$95$m / y$95$m), $MachinePrecision] + N[(x$95$m * N[(x$95$m / N[(y$95$m * y$95$m), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision]], $MachinePrecision] * N[Abs[y$95$m], $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\begin{array}{l}
\mathbf{if}\;y\_m \leq 1.05 \cdot 10^{+120}:\\
\;\;\;\;z\_m \cdot \mathsf{fma}\left(\frac{0.5}{z\_m}, \frac{\mathsf{fma}\left(y\_m, y\_m, x\_m \cdot x\_m\right)}{z\_m}, 1\right)\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\frac{z\_m}{y\_m}, \frac{z\_m}{y\_m}, \mathsf{fma}\left(x\_m, \frac{x\_m}{y\_m \cdot y\_m}, 1\right)\right)} \cdot \left|y\_m\right|\\
\end{array}
\end{array}
if y < 1.05e120Initial program 44.9%
Taylor expanded in z around inf
lower-*.f64N/A
lower-+.f64N/A
lower-*.f64N/A
lower-/.f64N/A
lower-+.f64N/A
lower-pow.f64N/A
lower-pow.f64N/A
lower-pow.f6482.9
Applied rewrites82.9%
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lift-pow.f64N/A
pow2N/A
lower-/.f64N/A
associate-*r/N/A
times-fracN/A
lower-fma.f64N/A
lower-/.f64N/A
lower-/.f6485.3
lift-+.f64N/A
lift-pow.f64N/A
pow2N/A
lift-*.f64N/A
lift-pow.f64N/A
pow2N/A
lift-*.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6485.3
Applied rewrites85.3%
if 1.05e120 < y Initial program 44.9%
lift-+.f64N/A
+-commutativeN/A
lift-+.f64N/A
associate-+l+N/A
lift-*.f64N/A
lower-fma.f64N/A
lift-*.f64N/A
lower-fma.f6444.9
Applied rewrites44.9%
lift-sqrt.f64N/A
lift-fma.f64N/A
sum-to-multN/A
sqrt-prodN/A
rem-sqrt-square-revN/A
lower-*.f64N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f64N/A
lower-/.f64N/A
lower-*.f64N/A
lower-fabs.f6429.1
Applied rewrites29.1%
lift-+.f64N/A
lift-*.f64N/A
lift-/.f64N/A
lift-*.f64N/A
lift-fma.f64N/A
lift-*.f64N/A
div-addN/A
associate-+l+N/A
lift-*.f64N/A
times-fracN/A
lower-fma.f64N/A
lower-/.f64N/A
lower-/.f64N/A
associate-/l*N/A
lower-fma.f64N/A
lower-/.f64N/A
lift-*.f6457.0
Applied rewrites57.0%
x_m = (fabs.f64 x) y_m = (fabs.f64 y) z_m = (fabs.f64 z) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (if (<= y_m 1.32e+154) (* z_m (fma (/ 0.5 z_m) (/ (fma y_m y_m (* x_m x_m)) z_m) 1.0)) (/ 1.0 (exp (- (log z_m))))))
x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
double tmp;
if (y_m <= 1.32e+154) {
tmp = z_m * fma((0.5 / z_m), (fma(y_m, y_m, (x_m * x_m)) / z_m), 1.0);
} else {
tmp = 1.0 / exp(-log(z_m));
}
return tmp;
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) tmp = 0.0 if (y_m <= 1.32e+154) tmp = Float64(z_m * fma(Float64(0.5 / z_m), Float64(fma(y_m, y_m, Float64(x_m * x_m)) / z_m), 1.0)); else tmp = Float64(1.0 / exp(Float64(-log(z_m)))); end return tmp end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := If[LessEqual[y$95$m, 1.32e+154], N[(z$95$m * N[(N[(0.5 / z$95$m), $MachinePrecision] * N[(N[(y$95$m * y$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision] / z$95$m), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision], N[(1.0 / N[Exp[(-N[Log[z$95$m], $MachinePrecision])], $MachinePrecision]), $MachinePrecision]]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\begin{array}{l}
\mathbf{if}\;y\_m \leq 1.32 \cdot 10^{+154}:\\
\;\;\;\;z\_m \cdot \mathsf{fma}\left(\frac{0.5}{z\_m}, \frac{\mathsf{fma}\left(y\_m, y\_m, x\_m \cdot x\_m\right)}{z\_m}, 1\right)\\
\mathbf{else}:\\
\;\;\;\;\frac{1}{e^{-\log z\_m}}\\
\end{array}
\end{array}
if y < 1.31999999999999998e154Initial program 44.9%
Taylor expanded in z around inf
lower-*.f64N/A
lower-+.f64N/A
lower-*.f64N/A
lower-/.f64N/A
lower-+.f64N/A
lower-pow.f64N/A
lower-pow.f64N/A
lower-pow.f6482.9
Applied rewrites82.9%
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lift-pow.f64N/A
pow2N/A
lower-/.f64N/A
associate-*r/N/A
times-fracN/A
lower-fma.f64N/A
lower-/.f64N/A
lower-/.f6485.3
lift-+.f64N/A
lift-pow.f64N/A
pow2N/A
lift-*.f64N/A
lift-pow.f64N/A
pow2N/A
lift-*.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6485.3
Applied rewrites85.3%
if 1.31999999999999998e154 < y Initial program 44.9%
lift-sqrt.f64N/A
pow1/2N/A
pow-to-expN/A
lower-exp.f64N/A
lower-*.f64N/A
lower-log.f6441.8
lift-+.f64N/A
lift-*.f64N/A
lower-fma.f6441.8
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6441.8
Applied rewrites41.8%
Taylor expanded in z around inf
lower-*.f64N/A
lower-log.f64N/A
lower-/.f6489.3
Applied rewrites89.3%
lift-*.f64N/A
mul-1-negN/A
lift-log.f64N/A
lift-/.f64N/A
log-recN/A
remove-double-negN/A
lower-log.f6489.3
Applied rewrites89.3%
lift-exp.f64N/A
sinh-+-cosh-revN/A
flip-+N/A
sinh-coshN/A
sinh---cosh-revN/A
Applied rewrites89.3%
x_m = (fabs.f64 x)
y_m = (fabs.f64 y)
z_m = (fabs.f64 z)
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
(FPCore (x_m y_m z_m)
:precision binary64
(let* ((t_0 (/ 1.0 (exp (- (log z_m))))))
(if (<= y_m 1.4e-256)
t_0
(if (<= y_m 1.32e+154)
(fma (* (/ (fma y_m y_m (* x_m x_m)) (* z_m z_m)) 0.5) z_m z_m)
t_0))))x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
double t_0 = 1.0 / exp(-log(z_m));
double tmp;
if (y_m <= 1.4e-256) {
tmp = t_0;
} else if (y_m <= 1.32e+154) {
tmp = fma(((fma(y_m, y_m, (x_m * x_m)) / (z_m * z_m)) * 0.5), z_m, z_m);
} else {
tmp = t_0;
}
return tmp;
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) t_0 = Float64(1.0 / exp(Float64(-log(z_m)))) tmp = 0.0 if (y_m <= 1.4e-256) tmp = t_0; elseif (y_m <= 1.32e+154) tmp = fma(Float64(Float64(fma(y_m, y_m, Float64(x_m * x_m)) / Float64(z_m * z_m)) * 0.5), z_m, z_m); else tmp = t_0; end return tmp end
x_m = N[Abs[x], $MachinePrecision]
y_m = N[Abs[y], $MachinePrecision]
z_m = N[Abs[z], $MachinePrecision]
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
code[x$95$m_, y$95$m_, z$95$m_] := Block[{t$95$0 = N[(1.0 / N[Exp[(-N[Log[z$95$m], $MachinePrecision])], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[y$95$m, 1.4e-256], t$95$0, If[LessEqual[y$95$m, 1.32e+154], N[(N[(N[(N[(y$95$m * y$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision] / N[(z$95$m * z$95$m), $MachinePrecision]), $MachinePrecision] * 0.5), $MachinePrecision] * z$95$m + z$95$m), $MachinePrecision], t$95$0]]]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\begin{array}{l}
t_0 := \frac{1}{e^{-\log z\_m}}\\
\mathbf{if}\;y\_m \leq 1.4 \cdot 10^{-256}:\\
\;\;\;\;t\_0\\
\mathbf{elif}\;y\_m \leq 1.32 \cdot 10^{+154}:\\
\;\;\;\;\mathsf{fma}\left(\frac{\mathsf{fma}\left(y\_m, y\_m, x\_m \cdot x\_m\right)}{z\_m \cdot z\_m} \cdot 0.5, z\_m, z\_m\right)\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if y < 1.40000000000000012e-256 or 1.31999999999999998e154 < y Initial program 44.9%
lift-sqrt.f64N/A
pow1/2N/A
pow-to-expN/A
lower-exp.f64N/A
lower-*.f64N/A
lower-log.f6441.8
lift-+.f64N/A
lift-*.f64N/A
lower-fma.f6441.8
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6441.8
Applied rewrites41.8%
Taylor expanded in z around inf
lower-*.f64N/A
lower-log.f64N/A
lower-/.f6489.3
Applied rewrites89.3%
lift-*.f64N/A
mul-1-negN/A
lift-log.f64N/A
lift-/.f64N/A
log-recN/A
remove-double-negN/A
lower-log.f6489.3
Applied rewrites89.3%
lift-exp.f64N/A
sinh-+-cosh-revN/A
flip-+N/A
sinh-coshN/A
sinh---cosh-revN/A
Applied rewrites89.3%
if 1.40000000000000012e-256 < y < 1.31999999999999998e154Initial program 44.9%
Taylor expanded in z around inf
lower-*.f64N/A
lower-+.f64N/A
lower-*.f64N/A
lower-/.f64N/A
lower-+.f64N/A
lower-pow.f64N/A
lower-pow.f64N/A
lower-pow.f6482.9
Applied rewrites82.9%
lift-*.f64N/A
lift-+.f64N/A
+-commutativeN/A
distribute-rgt-inN/A
*-lft-identityN/A
lower-fma.f6482.9
Applied rewrites82.9%
x_m = (fabs.f64 x)
y_m = (fabs.f64 y)
z_m = (fabs.f64 z)
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
(FPCore (x_m y_m z_m)
:precision binary64
(let* ((t_0 (/ 1.0 (exp (- (log z_m))))))
(if (<= z_m 8.5e-157)
t_0
(if (<= z_m 1.12e+154)
(sqrt (fma y_m y_m (fma z_m z_m (* x_m x_m))))
t_0))))x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
double t_0 = 1.0 / exp(-log(z_m));
double tmp;
if (z_m <= 8.5e-157) {
tmp = t_0;
} else if (z_m <= 1.12e+154) {
tmp = sqrt(fma(y_m, y_m, fma(z_m, z_m, (x_m * x_m))));
} else {
tmp = t_0;
}
return tmp;
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) t_0 = Float64(1.0 / exp(Float64(-log(z_m)))) tmp = 0.0 if (z_m <= 8.5e-157) tmp = t_0; elseif (z_m <= 1.12e+154) tmp = sqrt(fma(y_m, y_m, fma(z_m, z_m, Float64(x_m * x_m)))); else tmp = t_0; end return tmp end
x_m = N[Abs[x], $MachinePrecision]
y_m = N[Abs[y], $MachinePrecision]
z_m = N[Abs[z], $MachinePrecision]
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
code[x$95$m_, y$95$m_, z$95$m_] := Block[{t$95$0 = N[(1.0 / N[Exp[(-N[Log[z$95$m], $MachinePrecision])], $MachinePrecision]), $MachinePrecision]}, If[LessEqual[z$95$m, 8.5e-157], t$95$0, If[LessEqual[z$95$m, 1.12e+154], N[Sqrt[N[(y$95$m * y$95$m + N[(z$95$m * z$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], t$95$0]]]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\begin{array}{l}
t_0 := \frac{1}{e^{-\log z\_m}}\\
\mathbf{if}\;z\_m \leq 8.5 \cdot 10^{-157}:\\
\;\;\;\;t\_0\\
\mathbf{elif}\;z\_m \leq 1.12 \cdot 10^{+154}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(y\_m, y\_m, \mathsf{fma}\left(z\_m, z\_m, x\_m \cdot x\_m\right)\right)}\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if z < 8.49999999999999976e-157 or 1.11999999999999994e154 < z Initial program 44.9%
lift-sqrt.f64N/A
pow1/2N/A
pow-to-expN/A
lower-exp.f64N/A
lower-*.f64N/A
lower-log.f6441.8
lift-+.f64N/A
lift-*.f64N/A
lower-fma.f6441.8
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6441.8
Applied rewrites41.8%
Taylor expanded in z around inf
lower-*.f64N/A
lower-log.f64N/A
lower-/.f6489.3
Applied rewrites89.3%
lift-*.f64N/A
mul-1-negN/A
lift-log.f64N/A
lift-/.f64N/A
log-recN/A
remove-double-negN/A
lower-log.f6489.3
Applied rewrites89.3%
lift-exp.f64N/A
sinh-+-cosh-revN/A
flip-+N/A
sinh-coshN/A
sinh---cosh-revN/A
Applied rewrites89.3%
if 8.49999999999999976e-157 < z < 1.11999999999999994e154Initial program 44.9%
lift-+.f64N/A
+-commutativeN/A
lift-+.f64N/A
associate-+l+N/A
lift-*.f64N/A
lower-fma.f64N/A
lift-*.f64N/A
lower-fma.f6444.9
Applied rewrites44.9%
x_m = (fabs.f64 x)
y_m = (fabs.f64 y)
z_m = (fabs.f64 z)
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
(FPCore (x_m y_m z_m)
:precision binary64
(let* ((t_0 (exp (log z_m))))
(if (<= z_m 8.5e-157)
t_0
(if (<= z_m 1.12e+154)
(sqrt (fma y_m y_m (fma z_m z_m (* x_m x_m))))
t_0))))x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
double t_0 = exp(log(z_m));
double tmp;
if (z_m <= 8.5e-157) {
tmp = t_0;
} else if (z_m <= 1.12e+154) {
tmp = sqrt(fma(y_m, y_m, fma(z_m, z_m, (x_m * x_m))));
} else {
tmp = t_0;
}
return tmp;
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) t_0 = exp(log(z_m)) tmp = 0.0 if (z_m <= 8.5e-157) tmp = t_0; elseif (z_m <= 1.12e+154) tmp = sqrt(fma(y_m, y_m, fma(z_m, z_m, Float64(x_m * x_m)))); else tmp = t_0; end return tmp end
x_m = N[Abs[x], $MachinePrecision]
y_m = N[Abs[y], $MachinePrecision]
z_m = N[Abs[z], $MachinePrecision]
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
code[x$95$m_, y$95$m_, z$95$m_] := Block[{t$95$0 = N[Exp[N[Log[z$95$m], $MachinePrecision]], $MachinePrecision]}, If[LessEqual[z$95$m, 8.5e-157], t$95$0, If[LessEqual[z$95$m, 1.12e+154], N[Sqrt[N[(y$95$m * y$95$m + N[(z$95$m * z$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision], t$95$0]]]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\begin{array}{l}
t_0 := e^{\log z\_m}\\
\mathbf{if}\;z\_m \leq 8.5 \cdot 10^{-157}:\\
\;\;\;\;t\_0\\
\mathbf{elif}\;z\_m \leq 1.12 \cdot 10^{+154}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(y\_m, y\_m, \mathsf{fma}\left(z\_m, z\_m, x\_m \cdot x\_m\right)\right)}\\
\mathbf{else}:\\
\;\;\;\;t\_0\\
\end{array}
\end{array}
if z < 8.49999999999999976e-157 or 1.11999999999999994e154 < z Initial program 44.9%
lift-sqrt.f64N/A
pow1/2N/A
pow-to-expN/A
lower-exp.f64N/A
lower-*.f64N/A
lower-log.f6441.8
lift-+.f64N/A
lift-*.f64N/A
lower-fma.f6441.8
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f6441.8
Applied rewrites41.8%
Taylor expanded in z around inf
lower-*.f64N/A
lower-log.f64N/A
lower-/.f6489.3
Applied rewrites89.3%
lift-*.f64N/A
mul-1-negN/A
lift-log.f64N/A
lift-/.f64N/A
log-recN/A
remove-double-negN/A
lower-log.f6489.3
Applied rewrites89.3%
if 8.49999999999999976e-157 < z < 1.11999999999999994e154Initial program 44.9%
lift-+.f64N/A
+-commutativeN/A
lift-+.f64N/A
associate-+l+N/A
lift-*.f64N/A
lower-fma.f64N/A
lift-*.f64N/A
lower-fma.f6444.9
Applied rewrites44.9%
x_m = (fabs.f64 x) y_m = (fabs.f64 y) z_m = (fabs.f64 z) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (sqrt (fma y_m y_m (fma z_m z_m (* x_m x_m)))))
x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return sqrt(fma(y_m, y_m, fma(z_m, z_m, (x_m * x_m))));
}
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return sqrt(fma(y_m, y_m, fma(z_m, z_m, Float64(x_m * x_m)))) end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := N[Sqrt[N[(y$95$m * y$95$m + N[(z$95$m * z$95$m + N[(x$95$m * x$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\sqrt{\mathsf{fma}\left(y\_m, y\_m, \mathsf{fma}\left(z\_m, z\_m, x\_m \cdot x\_m\right)\right)}
\end{array}
Initial program 44.9%
lift-+.f64N/A
+-commutativeN/A
lift-+.f64N/A
associate-+l+N/A
lift-*.f64N/A
lower-fma.f64N/A
lift-*.f64N/A
lower-fma.f6444.9
Applied rewrites44.9%
x_m = (fabs.f64 x) y_m = (fabs.f64 y) z_m = (fabs.f64 z) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (* (/ y_m x_m) (fabs x_m)))
x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return (y_m / x_m) * fabs(x_m);
}
x_m = private
y_m = private
z_m = private
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
module fmin_fmax_functions
implicit none
private
public fmax
public fmin
interface fmax
module procedure fmax88
module procedure fmax44
module procedure fmax84
module procedure fmax48
end interface
interface fmin
module procedure fmin88
module procedure fmin44
module procedure fmin84
module procedure fmin48
end interface
contains
real(8) function fmax88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(4) function fmax44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(8) function fmax84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, max(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmax48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), max(dble(x), y), y /= y), x /= x)
end function
real(8) function fmin88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(4) function fmin44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(8) function fmin84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, min(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmin48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), min(dble(x), y), y /= y), x /= x)
end function
end module
real(8) function code(x_m, y_m, z_m)
use fmin_fmax_functions
real(8), intent (in) :: x_m
real(8), intent (in) :: y_m
real(8), intent (in) :: z_m
code = (y_m / x_m) * abs(x_m)
end function
x_m = Math.abs(x);
y_m = Math.abs(y);
z_m = Math.abs(z);
assert x_m < y_m && y_m < z_m;
public static double code(double x_m, double y_m, double z_m) {
return (y_m / x_m) * Math.abs(x_m);
}
x_m = math.fabs(x) y_m = math.fabs(y) z_m = math.fabs(z) [x_m, y_m, z_m] = sort([x_m, y_m, z_m]) def code(x_m, y_m, z_m): return (y_m / x_m) * math.fabs(x_m)
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return Float64(Float64(y_m / x_m) * abs(x_m)) end
x_m = abs(x);
y_m = abs(y);
z_m = abs(z);
x_m, y_m, z_m = num2cell(sort([x_m, y_m, z_m])){:}
function tmp = code(x_m, y_m, z_m)
tmp = (y_m / x_m) * abs(x_m);
end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := N[(N[(y$95$m / x$95$m), $MachinePrecision] * N[Abs[x$95$m], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
\frac{y\_m}{x\_m} \cdot \left|x\_m\right|
\end{array}
Initial program 44.9%
lift-sqrt.f64N/A
lift-+.f64N/A
sum-to-multN/A
sqrt-prodN/A
lift-*.f64N/A
rem-sqrt-square-revN/A
lower-*.f64N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f64N/A
lower-/.f64N/A
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f64N/A
lower-fabs.f6411.9
Applied rewrites11.9%
Taylor expanded in y around inf
lower-*.f64N/A
lower-sqrt.f64N/A
lower-/.f64N/A
lower-pow.f645.6
Applied rewrites5.6%
Taylor expanded in x around 0
lower-/.f645.7
Applied rewrites5.7%
x_m = (fabs.f64 x) y_m = (fabs.f64 y) z_m = (fabs.f64 z) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (* 1.0 (fabs x_m)))
x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return 1.0 * fabs(x_m);
}
x_m = private
y_m = private
z_m = private
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
module fmin_fmax_functions
implicit none
private
public fmax
public fmin
interface fmax
module procedure fmax88
module procedure fmax44
module procedure fmax84
module procedure fmax48
end interface
interface fmin
module procedure fmin88
module procedure fmin44
module procedure fmin84
module procedure fmin48
end interface
contains
real(8) function fmax88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(4) function fmax44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(8) function fmax84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, max(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmax48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), max(dble(x), y), y /= y), x /= x)
end function
real(8) function fmin88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(4) function fmin44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(8) function fmin84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, min(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmin48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), min(dble(x), y), y /= y), x /= x)
end function
end module
real(8) function code(x_m, y_m, z_m)
use fmin_fmax_functions
real(8), intent (in) :: x_m
real(8), intent (in) :: y_m
real(8), intent (in) :: z_m
code = 1.0d0 * abs(x_m)
end function
x_m = Math.abs(x);
y_m = Math.abs(y);
z_m = Math.abs(z);
assert x_m < y_m && y_m < z_m;
public static double code(double x_m, double y_m, double z_m) {
return 1.0 * Math.abs(x_m);
}
x_m = math.fabs(x) y_m = math.fabs(y) z_m = math.fabs(z) [x_m, y_m, z_m] = sort([x_m, y_m, z_m]) def code(x_m, y_m, z_m): return 1.0 * math.fabs(x_m)
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return Float64(1.0 * abs(x_m)) end
x_m = abs(x);
y_m = abs(y);
z_m = abs(z);
x_m, y_m, z_m = num2cell(sort([x_m, y_m, z_m])){:}
function tmp = code(x_m, y_m, z_m)
tmp = 1.0 * abs(x_m);
end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := N[(1.0 * N[Abs[x$95$m], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
1 \cdot \left|x\_m\right|
\end{array}
Initial program 44.9%
lift-sqrt.f64N/A
lift-+.f64N/A
sum-to-multN/A
sqrt-prodN/A
lift-*.f64N/A
rem-sqrt-square-revN/A
lower-*.f64N/A
lower-sqrt.f64N/A
+-commutativeN/A
lower-+.f64N/A
lower-/.f64N/A
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lower-fma.f64N/A
lower-fabs.f6411.9
Applied rewrites11.9%
Taylor expanded in x around inf
Applied rewrites3.4%
x_m = (fabs.f64 x) y_m = (fabs.f64 y) z_m = (fabs.f64 z) NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. (FPCore (x_m y_m z_m) :precision binary64 (- x_m))
x_m = fabs(x);
y_m = fabs(y);
z_m = fabs(z);
assert(x_m < y_m && y_m < z_m);
double code(double x_m, double y_m, double z_m) {
return -x_m;
}
x_m = private
y_m = private
z_m = private
NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function.
module fmin_fmax_functions
implicit none
private
public fmax
public fmin
interface fmax
module procedure fmax88
module procedure fmax44
module procedure fmax84
module procedure fmax48
end interface
interface fmin
module procedure fmin88
module procedure fmin44
module procedure fmin84
module procedure fmin48
end interface
contains
real(8) function fmax88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(4) function fmax44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, max(x, y), y /= y), x /= x)
end function
real(8) function fmax84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, max(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmax48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), max(dble(x), y), y /= y), x /= x)
end function
real(8) function fmin88(x, y) result (res)
real(8), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(4) function fmin44(x, y) result (res)
real(4), intent (in) :: x
real(4), intent (in) :: y
res = merge(y, merge(x, min(x, y), y /= y), x /= x)
end function
real(8) function fmin84(x, y) result(res)
real(8), intent (in) :: x
real(4), intent (in) :: y
res = merge(dble(y), merge(x, min(x, dble(y)), y /= y), x /= x)
end function
real(8) function fmin48(x, y) result(res)
real(4), intent (in) :: x
real(8), intent (in) :: y
res = merge(y, merge(dble(x), min(dble(x), y), y /= y), x /= x)
end function
end module
real(8) function code(x_m, y_m, z_m)
use fmin_fmax_functions
real(8), intent (in) :: x_m
real(8), intent (in) :: y_m
real(8), intent (in) :: z_m
code = -x_m
end function
x_m = Math.abs(x);
y_m = Math.abs(y);
z_m = Math.abs(z);
assert x_m < y_m && y_m < z_m;
public static double code(double x_m, double y_m, double z_m) {
return -x_m;
}
x_m = math.fabs(x) y_m = math.fabs(y) z_m = math.fabs(z) [x_m, y_m, z_m] = sort([x_m, y_m, z_m]) def code(x_m, y_m, z_m): return -x_m
x_m = abs(x) y_m = abs(y) z_m = abs(z) x_m, y_m, z_m = sort([x_m, y_m, z_m]) function code(x_m, y_m, z_m) return Float64(-x_m) end
x_m = abs(x);
y_m = abs(y);
z_m = abs(z);
x_m, y_m, z_m = num2cell(sort([x_m, y_m, z_m])){:}
function tmp = code(x_m, y_m, z_m)
tmp = -x_m;
end
x_m = N[Abs[x], $MachinePrecision] y_m = N[Abs[y], $MachinePrecision] z_m = N[Abs[z], $MachinePrecision] NOTE: x_m, y_m, and z_m should be sorted in increasing order before calling this function. code[x$95$m_, y$95$m_, z$95$m_] := (-x$95$m)
\begin{array}{l}
x_m = \left|x\right|
\\
y_m = \left|y\right|
\\
z_m = \left|z\right|
\\
[x_m, y_m, z_m] = \mathsf{sort}([x_m, y_m, z_m])\\
\\
-x\_m
\end{array}
Initial program 44.9%
Taylor expanded in x around -inf
lower-*.f641.7
Applied rewrites1.7%
lift-*.f64N/A
mul-1-negN/A
lower-neg.f641.7
Applied rewrites1.7%
herbie shell --seed 2025142
(FPCore (x y z)
:name "bug366 (missed optimization)"
:precision binary64
(sqrt (+ (* x x) (+ (* y y) (* z z)))))