
(FPCore (l Om kx ky)
:precision binary64
(sqrt
(*
(/ 1.0 2.0)
(+
1.0
(/
1.0
(sqrt
(+
1.0
(*
(pow (/ (* 2.0 l) Om) 2.0)
(+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))
double code(double l, double Om, double kx, double ky) {
return sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + (pow(((2.0 * l) / Om), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0)))))))));
}
real(8) function code(l, om, kx, ky)
real(8), intent (in) :: l
real(8), intent (in) :: om
real(8), intent (in) :: kx
real(8), intent (in) :: ky
code = sqrt(((1.0d0 / 2.0d0) * (1.0d0 + (1.0d0 / sqrt((1.0d0 + ((((2.0d0 * l) / om) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0)))))))))
end function
public static double code(double l, double Om, double kx, double ky) {
return Math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / Math.sqrt((1.0 + (Math.pow(((2.0 * l) / Om), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0)))))))));
}
def code(l, Om, kx, ky): return math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / math.sqrt((1.0 + (math.pow(((2.0 * l) / Om), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0)))))))))
function code(l, Om, kx, ky) return sqrt(Float64(Float64(1.0 / 2.0) * Float64(1.0 + Float64(1.0 / sqrt(Float64(1.0 + Float64((Float64(Float64(2.0 * l) / Om) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))))))))) end
function tmp = code(l, Om, kx, ky) tmp = sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + ((((2.0 * l) / Om) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))))))))); end
code[l_, Om_, kx_, ky_] := N[Sqrt[N[(N[(1.0 / 2.0), $MachinePrecision] * N[(1.0 + N[(1.0 / N[Sqrt[N[(1.0 + N[(N[Power[N[(N[(2.0 * l), $MachinePrecision] / Om), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)}
\end{array}
Sampling outcomes in binary64 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (l Om kx ky)
:precision binary64
(sqrt
(*
(/ 1.0 2.0)
(+
1.0
(/
1.0
(sqrt
(+
1.0
(*
(pow (/ (* 2.0 l) Om) 2.0)
(+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))
double code(double l, double Om, double kx, double ky) {
return sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + (pow(((2.0 * l) / Om), 2.0) * (pow(sin(kx), 2.0) + pow(sin(ky), 2.0)))))))));
}
real(8) function code(l, om, kx, ky)
real(8), intent (in) :: l
real(8), intent (in) :: om
real(8), intent (in) :: kx
real(8), intent (in) :: ky
code = sqrt(((1.0d0 / 2.0d0) * (1.0d0 + (1.0d0 / sqrt((1.0d0 + ((((2.0d0 * l) / om) ** 2.0d0) * ((sin(kx) ** 2.0d0) + (sin(ky) ** 2.0d0)))))))))
end function
public static double code(double l, double Om, double kx, double ky) {
return Math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / Math.sqrt((1.0 + (Math.pow(((2.0 * l) / Om), 2.0) * (Math.pow(Math.sin(kx), 2.0) + Math.pow(Math.sin(ky), 2.0)))))))));
}
def code(l, Om, kx, ky): return math.sqrt(((1.0 / 2.0) * (1.0 + (1.0 / math.sqrt((1.0 + (math.pow(((2.0 * l) / Om), 2.0) * (math.pow(math.sin(kx), 2.0) + math.pow(math.sin(ky), 2.0)))))))))
function code(l, Om, kx, ky) return sqrt(Float64(Float64(1.0 / 2.0) * Float64(1.0 + Float64(1.0 / sqrt(Float64(1.0 + Float64((Float64(Float64(2.0 * l) / Om) ^ 2.0) * Float64((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))))))))) end
function tmp = code(l, Om, kx, ky) tmp = sqrt(((1.0 / 2.0) * (1.0 + (1.0 / sqrt((1.0 + ((((2.0 * l) / Om) ^ 2.0) * ((sin(kx) ^ 2.0) + (sin(ky) ^ 2.0))))))))); end
code[l_, Om_, kx_, ky_] := N[Sqrt[N[(N[(1.0 / 2.0), $MachinePrecision] * N[(1.0 + N[(1.0 / N[Sqrt[N[(1.0 + N[(N[Power[N[(N[(2.0 * l), $MachinePrecision] / Om), $MachinePrecision], 2.0], $MachinePrecision] * N[(N[Power[N[Sin[kx], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[ky], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]), $MachinePrecision]), $MachinePrecision]), $MachinePrecision]], $MachinePrecision]
\begin{array}{l}
\\
\sqrt{\frac{1}{2} \cdot \left(1 + \frac{1}{\sqrt{1 + {\left(\frac{2 \cdot \ell}{Om}\right)}^{2} \cdot \left({\sin kx}^{2} + {\sin ky}^{2}\right)}}\right)}
\end{array}
ky_m = (fabs.f64 ky)
kx_m = (fabs.f64 kx)
NOTE: l, Om, kx_m, and ky_m should be sorted in increasing order before calling this function.
(FPCore (l Om kx_m ky_m)
:precision binary64
(let* ((t_0 (* (/ l Om) 2.0)))
(if (<= (pow (sin ky_m) 2.0) 2e-38)
(sqrt
(*
(+
(/ 1.0 (sqrt (fma t_0 (* (+ (* kx_m kx_m) (* ky_m ky_m)) t_0) 1.0)))
1.0)
0.5))
(sqrt
(*
(+
(/
1.0
(sqrt
(fma
(* 4.0 (/ l Om))
(*
(- 1.0 (* (+ (cos (* kx_m 2.0)) (cos (+ ky_m ky_m))) 0.5))
(/ l Om))
1.0)))
1.0)
0.5)))))ky_m = fabs(ky);
kx_m = fabs(kx);
assert(l < Om && Om < kx_m && kx_m < ky_m);
double code(double l, double Om, double kx_m, double ky_m) {
double t_0 = (l / Om) * 2.0;
double tmp;
if (pow(sin(ky_m), 2.0) <= 2e-38) {
tmp = sqrt((((1.0 / sqrt(fma(t_0, (((kx_m * kx_m) + (ky_m * ky_m)) * t_0), 1.0))) + 1.0) * 0.5));
} else {
tmp = sqrt((((1.0 / sqrt(fma((4.0 * (l / Om)), ((1.0 - ((cos((kx_m * 2.0)) + cos((ky_m + ky_m))) * 0.5)) * (l / Om)), 1.0))) + 1.0) * 0.5));
}
return tmp;
}
ky_m = abs(ky) kx_m = abs(kx) l, Om, kx_m, ky_m = sort([l, Om, kx_m, ky_m]) function code(l, Om, kx_m, ky_m) t_0 = Float64(Float64(l / Om) * 2.0) tmp = 0.0 if ((sin(ky_m) ^ 2.0) <= 2e-38) tmp = sqrt(Float64(Float64(Float64(1.0 / sqrt(fma(t_0, Float64(Float64(Float64(kx_m * kx_m) + Float64(ky_m * ky_m)) * t_0), 1.0))) + 1.0) * 0.5)); else tmp = sqrt(Float64(Float64(Float64(1.0 / sqrt(fma(Float64(4.0 * Float64(l / Om)), Float64(Float64(1.0 - Float64(Float64(cos(Float64(kx_m * 2.0)) + cos(Float64(ky_m + ky_m))) * 0.5)) * Float64(l / Om)), 1.0))) + 1.0) * 0.5)); end return tmp end
ky_m = N[Abs[ky], $MachinePrecision]
kx_m = N[Abs[kx], $MachinePrecision]
NOTE: l, Om, kx_m, and ky_m should be sorted in increasing order before calling this function.
code[l_, Om_, kx$95$m_, ky$95$m_] := Block[{t$95$0 = N[(N[(l / Om), $MachinePrecision] * 2.0), $MachinePrecision]}, If[LessEqual[N[Power[N[Sin[ky$95$m], $MachinePrecision], 2.0], $MachinePrecision], 2e-38], N[Sqrt[N[(N[(N[(1.0 / N[Sqrt[N[(t$95$0 * N[(N[(N[(kx$95$m * kx$95$m), $MachinePrecision] + N[(ky$95$m * ky$95$m), $MachinePrecision]), $MachinePrecision] * t$95$0), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision] * 0.5), $MachinePrecision]], $MachinePrecision], N[Sqrt[N[(N[(N[(1.0 / N[Sqrt[N[(N[(4.0 * N[(l / Om), $MachinePrecision]), $MachinePrecision] * N[(N[(1.0 - N[(N[(N[Cos[N[(kx$95$m * 2.0), $MachinePrecision]], $MachinePrecision] + N[Cos[N[(ky$95$m + ky$95$m), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] * 0.5), $MachinePrecision]), $MachinePrecision] * N[(l / Om), $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision] * 0.5), $MachinePrecision]], $MachinePrecision]]]
\begin{array}{l}
ky_m = \left|ky\right|
\\
kx_m = \left|kx\right|
\\
[l, Om, kx_m, ky_m] = \mathsf{sort}([l, Om, kx_m, ky_m])\\
\\
\begin{array}{l}
t_0 := \frac{\ell}{Om} \cdot 2\\
\mathbf{if}\;{\sin ky\_m}^{2} \leq 2 \cdot 10^{-38}:\\
\;\;\;\;\sqrt{\left(\frac{1}{\sqrt{\mathsf{fma}\left(t\_0, \left(kx\_m \cdot kx\_m + ky\_m \cdot ky\_m\right) \cdot t\_0, 1\right)}} + 1\right) \cdot 0.5}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\left(\frac{1}{\sqrt{\mathsf{fma}\left(4 \cdot \frac{\ell}{Om}, \left(1 - \left(\cos \left(kx\_m \cdot 2\right) + \cos \left(ky\_m + ky\_m\right)\right) \cdot 0.5\right) \cdot \frac{\ell}{Om}, 1\right)}} + 1\right) \cdot 0.5}\\
\end{array}
\end{array}
if (pow.f64 (sin.f64 ky) #s(literal 2 binary64)) < 1.9999999999999999e-38Initial program 96.9%
Taylor expanded in ky around 0
unpow2N/A
lower-*.f6496.9
Applied rewrites96.9%
lift-+.f64N/A
+-commutativeN/A
lift-*.f64N/A
lift-pow.f64N/A
unpow2N/A
associate-*l*N/A
lower-fma.f64N/A
Applied rewrites98.7%
Taylor expanded in kx around 0
unpow2N/A
lower-*.f6498.7
Applied rewrites98.7%
lift-/.f64N/A
metadata-eval98.7
Applied rewrites98.7%
if 1.9999999999999999e-38 < (pow.f64 (sin.f64 ky) #s(literal 2 binary64)) Initial program 100.0%
Applied rewrites100.0%
lift-/.f64N/A
metadata-eval100.0
Applied rewrites100.0%
Taylor expanded in ky around inf
lower--.f64N/A
+-commutativeN/A
*-commutativeN/A
metadata-evalN/A
distribute-lft-neg-inN/A
*-commutativeN/A
distribute-lft-outN/A
lower-*.f64N/A
distribute-lft-neg-inN/A
metadata-evalN/A
lower-+.f64N/A
metadata-evalN/A
distribute-lft-neg-inN/A
lower-cos.f64N/A
distribute-lft-neg-inN/A
metadata-evalN/A
*-commutativeN/A
lower-*.f64N/A
Applied rewrites100.0%
Applied rewrites100.0%
Final simplification99.7%
ky_m = (fabs.f64 ky)
kx_m = (fabs.f64 kx)
NOTE: l, Om, kx_m, and ky_m should be sorted in increasing order before calling this function.
(FPCore (l Om kx_m ky_m)
:precision binary64
(let* ((t_0 (* (/ l Om) 2.0)))
(if (<=
(/
1.0
(sqrt
(+
(*
(+ (pow (sin ky_m) 2.0) (pow (sin kx_m) 2.0))
(pow (/ (* l 2.0) Om) 2.0))
1.0)))
0.0001)
(sqrt (fma (/ Om (* (sin ky_m) l)) -0.25 0.5))
(sqrt
(fma
(sqrt (/ 1.0 (fma (* (fma -0.5 (cos (+ kx_m kx_m)) 0.5) t_0) t_0 1.0)))
0.5
0.5)))))ky_m = fabs(ky);
kx_m = fabs(kx);
assert(l < Om && Om < kx_m && kx_m < ky_m);
double code(double l, double Om, double kx_m, double ky_m) {
double t_0 = (l / Om) * 2.0;
double tmp;
if ((1.0 / sqrt((((pow(sin(ky_m), 2.0) + pow(sin(kx_m), 2.0)) * pow(((l * 2.0) / Om), 2.0)) + 1.0))) <= 0.0001) {
tmp = sqrt(fma((Om / (sin(ky_m) * l)), -0.25, 0.5));
} else {
tmp = sqrt(fma(sqrt((1.0 / fma((fma(-0.5, cos((kx_m + kx_m)), 0.5) * t_0), t_0, 1.0))), 0.5, 0.5));
}
return tmp;
}
ky_m = abs(ky) kx_m = abs(kx) l, Om, kx_m, ky_m = sort([l, Om, kx_m, ky_m]) function code(l, Om, kx_m, ky_m) t_0 = Float64(Float64(l / Om) * 2.0) tmp = 0.0 if (Float64(1.0 / sqrt(Float64(Float64(Float64((sin(ky_m) ^ 2.0) + (sin(kx_m) ^ 2.0)) * (Float64(Float64(l * 2.0) / Om) ^ 2.0)) + 1.0))) <= 0.0001) tmp = sqrt(fma(Float64(Om / Float64(sin(ky_m) * l)), -0.25, 0.5)); else tmp = sqrt(fma(sqrt(Float64(1.0 / fma(Float64(fma(-0.5, cos(Float64(kx_m + kx_m)), 0.5) * t_0), t_0, 1.0))), 0.5, 0.5)); end return tmp end
ky_m = N[Abs[ky], $MachinePrecision]
kx_m = N[Abs[kx], $MachinePrecision]
NOTE: l, Om, kx_m, and ky_m should be sorted in increasing order before calling this function.
code[l_, Om_, kx$95$m_, ky$95$m_] := Block[{t$95$0 = N[(N[(l / Om), $MachinePrecision] * 2.0), $MachinePrecision]}, If[LessEqual[N[(1.0 / N[Sqrt[N[(N[(N[(N[Power[N[Sin[ky$95$m], $MachinePrecision], 2.0], $MachinePrecision] + N[Power[N[Sin[kx$95$m], $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision] * N[Power[N[(N[(l * 2.0), $MachinePrecision] / Om), $MachinePrecision], 2.0], $MachinePrecision]), $MachinePrecision] + 1.0), $MachinePrecision]], $MachinePrecision]), $MachinePrecision], 0.0001], N[Sqrt[N[(N[(Om / N[(N[Sin[ky$95$m], $MachinePrecision] * l), $MachinePrecision]), $MachinePrecision] * -0.25 + 0.5), $MachinePrecision]], $MachinePrecision], N[Sqrt[N[(N[Sqrt[N[(1.0 / N[(N[(N[(-0.5 * N[Cos[N[(kx$95$m + kx$95$m), $MachinePrecision]], $MachinePrecision] + 0.5), $MachinePrecision] * t$95$0), $MachinePrecision] * t$95$0 + 1.0), $MachinePrecision]), $MachinePrecision]], $MachinePrecision] * 0.5 + 0.5), $MachinePrecision]], $MachinePrecision]]]
\begin{array}{l}
ky_m = \left|ky\right|
\\
kx_m = \left|kx\right|
\\
[l, Om, kx_m, ky_m] = \mathsf{sort}([l, Om, kx_m, ky_m])\\
\\
\begin{array}{l}
t_0 := \frac{\ell}{Om} \cdot 2\\
\mathbf{if}\;\frac{1}{\sqrt{\left({\sin ky\_m}^{2} + {\sin kx\_m}^{2}\right) \cdot {\left(\frac{\ell \cdot 2}{Om}\right)}^{2} + 1}} \leq 0.0001:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\frac{Om}{\sin ky\_m \cdot \ell}, -0.25, 0.5\right)}\\
\mathbf{else}:\\
\;\;\;\;\sqrt{\mathsf{fma}\left(\sqrt{\frac{1}{\mathsf{fma}\left(\mathsf{fma}\left(-0.5, \cos \left(kx\_m + kx\_m\right), 0.5\right) \cdot t\_0, t\_0, 1\right)}}, 0.5, 0.5\right)}\\
\end{array}
\end{array}
if (/.f64 #s(literal 1 binary64) (sqrt.f64 (+.f64 #s(literal 1 binary64) (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))))) < 1.00000000000000005e-4Initial program 100.0%
Taylor expanded in kx around 0
+-commutativeN/A
distribute-rgt-inN/A
metadata-evalN/A
lower-fma.f64N/A
Applied rewrites90.0%
Taylor expanded in l around -inf
Applied rewrites99.4%
if 1.00000000000000005e-4 < (/.f64 #s(literal 1 binary64) (sqrt.f64 (+.f64 #s(literal 1 binary64) (*.f64 (pow.f64 (/.f64 (*.f64 #s(literal 2 binary64) l) Om) #s(literal 2 binary64)) (+.f64 (pow.f64 (sin.f64 kx) #s(literal 2 binary64)) (pow.f64 (sin.f64 ky) #s(literal 2 binary64))))))) Initial program 97.3%
Taylor expanded in kx around 0
+-commutativeN/A
distribute-rgt-inN/A
metadata-evalN/A
lower-fma.f64N/A
Applied rewrites82.8%
Applied rewrites96.5%
Final simplification97.8%
herbie shell --seed 2024234
(FPCore (l Om kx ky)
:name "Toniolo and Linder, Equation (3a)"
:precision binary64
(sqrt (* (/ 1.0 2.0) (+ 1.0 (/ 1.0 (sqrt (+ 1.0 (* (pow (/ (* 2.0 l) Om) 2.0) (+ (pow (sin kx) 2.0) (pow (sin ky) 2.0))))))))))