
(FPCore (x y z t a b) :precision binary64 (* (* x (cos (/ (* (* (+ (* y 2.0) 1.0) z) t) 16.0))) (cos (/ (* (* (+ (* a 2.0) 1.0) b) t) 16.0))))
double code(double x, double y, double z, double t, double a, double b) {
return (x * cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * cos((((((a * 2.0) + 1.0) * b) * t) / 16.0));
}
real(8) function code(x, y, z, t, a, b)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
real(8), intent (in) :: t
real(8), intent (in) :: a
real(8), intent (in) :: b
code = (x * cos((((((y * 2.0d0) + 1.0d0) * z) * t) / 16.0d0))) * cos((((((a * 2.0d0) + 1.0d0) * b) * t) / 16.0d0))
end function
public static double code(double x, double y, double z, double t, double a, double b) {
return (x * Math.cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * Math.cos((((((a * 2.0) + 1.0) * b) * t) / 16.0));
}
def code(x, y, z, t, a, b): return (x * math.cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * math.cos((((((a * 2.0) + 1.0) * b) * t) / 16.0))
function code(x, y, z, t, a, b) return Float64(Float64(x * cos(Float64(Float64(Float64(Float64(Float64(y * 2.0) + 1.0) * z) * t) / 16.0))) * cos(Float64(Float64(Float64(Float64(Float64(a * 2.0) + 1.0) * b) * t) / 16.0))) end
function tmp = code(x, y, z, t, a, b) tmp = (x * cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * cos((((((a * 2.0) + 1.0) * b) * t) / 16.0)); end
code[x_, y_, z_, t_, a_, b_] := N[(N[(x * N[Cos[N[(N[(N[(N[(N[(y * 2.0), $MachinePrecision] + 1.0), $MachinePrecision] * z), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] * N[Cos[N[(N[(N[(N[(N[(a * 2.0), $MachinePrecision] + 1.0), $MachinePrecision] * b), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(x \cdot \cos \left(\frac{\left(\left(y \cdot 2 + 1\right) \cdot z\right) \cdot t}{16}\right)\right) \cdot \cos \left(\frac{\left(\left(a \cdot 2 + 1\right) \cdot b\right) \cdot t}{16}\right)
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 3 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (x y z t a b) :precision binary64 (* (* x (cos (/ (* (* (+ (* y 2.0) 1.0) z) t) 16.0))) (cos (/ (* (* (+ (* a 2.0) 1.0) b) t) 16.0))))
double code(double x, double y, double z, double t, double a, double b) {
return (x * cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * cos((((((a * 2.0) + 1.0) * b) * t) / 16.0));
}
real(8) function code(x, y, z, t, a, b)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
real(8), intent (in) :: t
real(8), intent (in) :: a
real(8), intent (in) :: b
code = (x * cos((((((y * 2.0d0) + 1.0d0) * z) * t) / 16.0d0))) * cos((((((a * 2.0d0) + 1.0d0) * b) * t) / 16.0d0))
end function
public static double code(double x, double y, double z, double t, double a, double b) {
return (x * Math.cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * Math.cos((((((a * 2.0) + 1.0) * b) * t) / 16.0));
}
def code(x, y, z, t, a, b): return (x * math.cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * math.cos((((((a * 2.0) + 1.0) * b) * t) / 16.0))
function code(x, y, z, t, a, b) return Float64(Float64(x * cos(Float64(Float64(Float64(Float64(Float64(y * 2.0) + 1.0) * z) * t) / 16.0))) * cos(Float64(Float64(Float64(Float64(Float64(a * 2.0) + 1.0) * b) * t) / 16.0))) end
function tmp = code(x, y, z, t, a, b) tmp = (x * cos((((((y * 2.0) + 1.0) * z) * t) / 16.0))) * cos((((((a * 2.0) + 1.0) * b) * t) / 16.0)); end
code[x_, y_, z_, t_, a_, b_] := N[(N[(x * N[Cos[N[(N[(N[(N[(N[(y * 2.0), $MachinePrecision] + 1.0), $MachinePrecision] * z), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] * N[Cos[N[(N[(N[(N[(N[(a * 2.0), $MachinePrecision] + 1.0), $MachinePrecision] * b), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
\left(x \cdot \cos \left(\frac{\left(\left(y \cdot 2 + 1\right) \cdot z\right) \cdot t}{16}\right)\right) \cdot \cos \left(\frac{\left(\left(a \cdot 2 + 1\right) \cdot b\right) \cdot t}{16}\right)
\end{array}
x\_m = (fabs.f64 x)
x\_s = (copysign.f64 #s(literal 1 binary64) x)
(FPCore (x_s x_m y z t a b)
:precision binary64
(let* ((t_1 (cos (/ (* (* b (+ (* a 2.0) 1.0)) t) 16.0))))
(*
x_s
(if (<=
(* t_1 (* (cos (/ (* t (* z (+ 1.0 (* 2.0 y)))) 16.0)) x_m))
1e+150)
(*
(*
(cos
(/
(*
(*
(* (* (/ -1.0 (fma -2.0 y 1.0)) (fma 2.0 y -1.0)) (fma 2.0 y 1.0))
z)
t)
16.0))
x_m)
t_1)
(* 1.0 (* 1.0 x_m))))))x\_m = fabs(x);
x\_s = copysign(1.0, x);
double code(double x_s, double x_m, double y, double z, double t, double a, double b) {
double t_1 = cos((((b * ((a * 2.0) + 1.0)) * t) / 16.0));
double tmp;
if ((t_1 * (cos(((t * (z * (1.0 + (2.0 * y)))) / 16.0)) * x_m)) <= 1e+150) {
tmp = (cos(((((((-1.0 / fma(-2.0, y, 1.0)) * fma(2.0, y, -1.0)) * fma(2.0, y, 1.0)) * z) * t) / 16.0)) * x_m) * t_1;
} else {
tmp = 1.0 * (1.0 * x_m);
}
return x_s * tmp;
}
x\_m = abs(x) x\_s = copysign(1.0, x) function code(x_s, x_m, y, z, t, a, b) t_1 = cos(Float64(Float64(Float64(b * Float64(Float64(a * 2.0) + 1.0)) * t) / 16.0)) tmp = 0.0 if (Float64(t_1 * Float64(cos(Float64(Float64(t * Float64(z * Float64(1.0 + Float64(2.0 * y)))) / 16.0)) * x_m)) <= 1e+150) tmp = Float64(Float64(cos(Float64(Float64(Float64(Float64(Float64(Float64(-1.0 / fma(-2.0, y, 1.0)) * fma(2.0, y, -1.0)) * fma(2.0, y, 1.0)) * z) * t) / 16.0)) * x_m) * t_1); else tmp = Float64(1.0 * Float64(1.0 * x_m)); end return Float64(x_s * tmp) end
x\_m = N[Abs[x], $MachinePrecision]
x\_s = N[With[{TMP1 = Abs[1.0], TMP2 = Sign[x]}, TMP1 * If[TMP2 == 0, 1, TMP2]], $MachinePrecision]
code[x$95$s_, x$95$m_, y_, z_, t_, a_, b_] := Block[{t$95$1 = N[Cos[N[(N[(N[(b * N[(N[(a * 2.0), $MachinePrecision] + 1.0), $MachinePrecision]), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision]}, N[(x$95$s * If[LessEqual[N[(t$95$1 * N[(N[Cos[N[(N[(t * N[(z * N[(1.0 + N[(2.0 * y), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision] * x$95$m), $MachinePrecision]), $MachinePrecision], 1e+150], N[(N[(N[Cos[N[(N[(N[(N[(N[(N[(-1.0 / N[(-2.0 * y + 1.0), $MachinePrecision]), $MachinePrecision] * N[(2.0 * y + -1.0), $MachinePrecision]), $MachinePrecision] * N[(2.0 * y + 1.0), $MachinePrecision]), $MachinePrecision] * z), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision] * x$95$m), $MachinePrecision] * t$95$1), $MachinePrecision], N[(1.0 * N[(1.0 * x$95$m), $MachinePrecision]), $MachinePrecision]]), $MachinePrecision]]
\begin{array}{l}
x\_m = \left|x\right|
\\
x\_s = \mathsf{copysign}\left(1, x\right)
\\
\begin{array}{l}
t_1 := \cos \left(\frac{\left(b \cdot \left(a \cdot 2 + 1\right)\right) \cdot t}{16}\right)\\
x\_s \cdot \begin{array}{l}
\mathbf{if}\;t\_1 \cdot \left(\cos \left(\frac{t \cdot \left(z \cdot \left(1 + 2 \cdot y\right)\right)}{16}\right) \cdot x\_m\right) \leq 10^{+150}:\\
\;\;\;\;\left(\cos \left(\frac{\left(\left(\left(\frac{-1}{\mathsf{fma}\left(-2, y, 1\right)} \cdot \mathsf{fma}\left(2, y, -1\right)\right) \cdot \mathsf{fma}\left(2, y, 1\right)\right) \cdot z\right) \cdot t}{16}\right) \cdot x\_m\right) \cdot t\_1\\
\mathbf{else}:\\
\;\;\;\;1 \cdot \left(1 \cdot x\_m\right)\\
\end{array}
\end{array}
\end{array}
if (*.f64 (*.f64 x (cos.f64 (/.f64 (*.f64 (*.f64 (+.f64 (*.f64 y #s(literal 2 binary64)) #s(literal 1 binary64)) z) t) #s(literal 16 binary64)))) (cos.f64 (/.f64 (*.f64 (*.f64 (+.f64 (*.f64 a #s(literal 2 binary64)) #s(literal 1 binary64)) b) t) #s(literal 16 binary64)))) < 9.99999999999999981e149Initial program 49.0%
lift-+.f64N/A
flip-+N/A
div-invN/A
metadata-evalN/A
difference-of-sqr-1N/A
lift-+.f64N/A
associate-*l*N/A
lower-*.f64N/A
lift-+.f64N/A
lift-*.f64N/A
*-commutativeN/A
lower-fma.f64N/A
lower-*.f64N/A
sub-negN/A
lift-*.f64N/A
*-commutativeN/A
metadata-evalN/A
lower-fma.f64N/A
frac-2negN/A
metadata-evalN/A
sub-negN/A
metadata-evalN/A
distribute-neg-inN/A
metadata-evalN/A
+-commutativeN/A
Applied rewrites49.2%
if 9.99999999999999981e149 < (*.f64 (*.f64 x (cos.f64 (/.f64 (*.f64 (*.f64 (+.f64 (*.f64 y #s(literal 2 binary64)) #s(literal 1 binary64)) z) t) #s(literal 16 binary64)))) (cos.f64 (/.f64 (*.f64 (*.f64 (+.f64 (*.f64 a #s(literal 2 binary64)) #s(literal 1 binary64)) b) t) #s(literal 16 binary64)))) Initial program 5.4%
Taylor expanded in t around 0
Applied rewrites8.8%
Taylor expanded in b around 0
Applied rewrites13.3%
Final simplification30.6%
x\_m = (fabs.f64 x) x\_s = (copysign.f64 #s(literal 1 binary64) x) (FPCore (x_s x_m y z t a b) :precision binary64 (* x_s (* (cos (/ (* (* (/ 1.0 (fma (fma (fma 8.0 a 4.0) a 2.0) a 1.0)) b) t) 16.0)) (* 1.0 x_m))))
x\_m = fabs(x);
x\_s = copysign(1.0, x);
double code(double x_s, double x_m, double y, double z, double t, double a, double b) {
return x_s * (cos(((((1.0 / fma(fma(fma(8.0, a, 4.0), a, 2.0), a, 1.0)) * b) * t) / 16.0)) * (1.0 * x_m));
}
x\_m = abs(x) x\_s = copysign(1.0, x) function code(x_s, x_m, y, z, t, a, b) return Float64(x_s * Float64(cos(Float64(Float64(Float64(Float64(1.0 / fma(fma(fma(8.0, a, 4.0), a, 2.0), a, 1.0)) * b) * t) / 16.0)) * Float64(1.0 * x_m))) end
x\_m = N[Abs[x], $MachinePrecision]
x\_s = N[With[{TMP1 = Abs[1.0], TMP2 = Sign[x]}, TMP1 * If[TMP2 == 0, 1, TMP2]], $MachinePrecision]
code[x$95$s_, x$95$m_, y_, z_, t_, a_, b_] := N[(x$95$s * N[(N[Cos[N[(N[(N[(N[(1.0 / N[(N[(N[(8.0 * a + 4.0), $MachinePrecision] * a + 2.0), $MachinePrecision] * a + 1.0), $MachinePrecision]), $MachinePrecision] * b), $MachinePrecision] * t), $MachinePrecision] / 16.0), $MachinePrecision]], $MachinePrecision] * N[(1.0 * x$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
x\_m = \left|x\right|
\\
x\_s = \mathsf{copysign}\left(1, x\right)
\\
x\_s \cdot \left(\cos \left(\frac{\left(\frac{1}{\mathsf{fma}\left(\mathsf{fma}\left(\mathsf{fma}\left(8, a, 4\right), a, 2\right), a, 1\right)} \cdot b\right) \cdot t}{16}\right) \cdot \left(1 \cdot x\_m\right)\right)
\end{array}
Initial program 26.3%
Taylor expanded in t around 0
Applied rewrites27.2%
Applied rewrites20.3%
Taylor expanded in a around 0
+-commutativeN/A
*-commutativeN/A
lower-fma.f64N/A
+-commutativeN/A
*-commutativeN/A
lower-fma.f64N/A
+-commutativeN/A
lower-fma.f6429.1
Applied rewrites29.1%
Final simplification29.1%
x\_m = (fabs.f64 x) x\_s = (copysign.f64 #s(literal 1 binary64) x) (FPCore (x_s x_m y z t a b) :precision binary64 (* x_s (* 1.0 (* 1.0 x_m))))
x\_m = fabs(x);
x\_s = copysign(1.0, x);
double code(double x_s, double x_m, double y, double z, double t, double a, double b) {
return x_s * (1.0 * (1.0 * x_m));
}
x\_m = abs(x)
x\_s = copysign(1.0d0, x)
real(8) function code(x_s, x_m, y, z, t, a, b)
real(8), intent (in) :: x_s
real(8), intent (in) :: x_m
real(8), intent (in) :: y
real(8), intent (in) :: z
real(8), intent (in) :: t
real(8), intent (in) :: a
real(8), intent (in) :: b
code = x_s * (1.0d0 * (1.0d0 * x_m))
end function
x\_m = Math.abs(x);
x\_s = Math.copySign(1.0, x);
public static double code(double x_s, double x_m, double y, double z, double t, double a, double b) {
return x_s * (1.0 * (1.0 * x_m));
}
x\_m = math.fabs(x) x\_s = math.copysign(1.0, x) def code(x_s, x_m, y, z, t, a, b): return x_s * (1.0 * (1.0 * x_m))
x\_m = abs(x) x\_s = copysign(1.0, x) function code(x_s, x_m, y, z, t, a, b) return Float64(x_s * Float64(1.0 * Float64(1.0 * x_m))) end
x\_m = abs(x); x\_s = sign(x) * abs(1.0); function tmp = code(x_s, x_m, y, z, t, a, b) tmp = x_s * (1.0 * (1.0 * x_m)); end
x\_m = N[Abs[x], $MachinePrecision]
x\_s = N[With[{TMP1 = Abs[1.0], TMP2 = Sign[x]}, TMP1 * If[TMP2 == 0, 1, TMP2]], $MachinePrecision]
code[x$95$s_, x$95$m_, y_, z_, t_, a_, b_] := N[(x$95$s * N[(1.0 * N[(1.0 * x$95$m), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
x\_m = \left|x\right|
\\
x\_s = \mathsf{copysign}\left(1, x\right)
\\
x\_s \cdot \left(1 \cdot \left(1 \cdot x\_m\right)\right)
\end{array}
Initial program 26.3%
Taylor expanded in t around 0
Applied rewrites27.2%
Taylor expanded in b around 0
Applied rewrites29.0%
Final simplification29.0%
(FPCore (x y z t a b) :precision binary64 (* x (cos (* (/ b 16.0) (/ t (+ (- 1.0 (* a 2.0)) (pow (* a 2.0) 2.0)))))))
double code(double x, double y, double z, double t, double a, double b) {
return x * cos(((b / 16.0) * (t / ((1.0 - (a * 2.0)) + pow((a * 2.0), 2.0)))));
}
real(8) function code(x, y, z, t, a, b)
real(8), intent (in) :: x
real(8), intent (in) :: y
real(8), intent (in) :: z
real(8), intent (in) :: t
real(8), intent (in) :: a
real(8), intent (in) :: b
code = x * cos(((b / 16.0d0) * (t / ((1.0d0 - (a * 2.0d0)) + ((a * 2.0d0) ** 2.0d0)))))
end function
public static double code(double x, double y, double z, double t, double a, double b) {
return x * Math.cos(((b / 16.0) * (t / ((1.0 - (a * 2.0)) + Math.pow((a * 2.0), 2.0)))));
}
def code(x, y, z, t, a, b): return x * math.cos(((b / 16.0) * (t / ((1.0 - (a * 2.0)) + math.pow((a * 2.0), 2.0)))))
function code(x, y, z, t, a, b) return Float64(x * cos(Float64(Float64(b / 16.0) * Float64(t / Float64(Float64(1.0 - Float64(a * 2.0)) + (Float64(a * 2.0) ^ 2.0)))))) end
function tmp = code(x, y, z, t, a, b) tmp = x * cos(((b / 16.0) * (t / ((1.0 - (a * 2.0)) + ((a * 2.0) ^ 2.0))))); end
code[x_, y_, z_, t_, a_, b_] := N[(x * N[Cos[N[(N[(b / 16.0), $MachinePrecision] * N[(t / N[(N[(1.0 - N[(a * 2.0), $MachinePrecision]), $MachinePrecision] + N[Power[N[(a * 2.0), $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]
\begin{array}{l}
\\
x \cdot \cos \left(\frac{b}{16} \cdot \frac{t}{\left(1 - a \cdot 2\right) + {\left(a \cdot 2\right)}^{2}}\right)
\end{array}
herbie shell --seed 2024235
(FPCore (x y z t a b)
:name "Codec.Picture.Jpg.FastDct:referenceDct from JuicyPixels-3.2.6.1"
:precision binary64
:alt
(! :herbie-platform default (* x (cos (* (/ b 16) (/ t (+ (- 1 (* a 2)) (pow (* a 2) 2)))))))
(* (* x (cos (/ (* (* (+ (* y 2.0) 1.0) z) t) 16.0))) (cos (/ (* (* (+ (* a 2.0) 1.0) b) t) 16.0))))