Isotropic LOD (LOD)

Percentage Accurate: 67.9% → 67.9%
Time: 7.3s
Alternatives: 6
Speedup: N/A×

Specification

?
\[\left(\left(\left(\left(\left(\left(\left(\left(1 \leq w \land w \leq 16384\right) \land \left(1 \leq h \land h \leq 16384\right)\right) \land \left(1 \leq d \land d \leq 4096\right)\right) \land \left(10^{-20} \leq \left|dX.u\right| \land \left|dX.u\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dX.v\right| \land \left|dX.v\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dX.w\right| \land \left|dX.w\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.u\right| \land \left|dY.u\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.v\right| \land \left|dY.v\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.w\right| \land \left|dY.w\right| \leq 10^{+20}\right)\]
\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_1 := \left\lfloor h\right\rfloor \cdot dY.v\\ t_2 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_3 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_4 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_5 := \left\lfloor w\right\rfloor \cdot dX.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dY.u))
        (t_1 (* (floor h) dY.v))
        (t_2 (* (floor h) dX.v))
        (t_3 (* (floor d) dY.w))
        (t_4 (* (floor d) dX.w))
        (t_5 (* (floor w) dX.u)))
   (log2
    (sqrt
     (fmax
      (+ (+ (* t_5 t_5) (* t_2 t_2)) (* t_4 t_4))
      (+ (+ (* t_0 t_0) (* t_1 t_1)) (* t_3 t_3)))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(w) * dY_46_u;
	float t_1 = floorf(h) * dY_46_v;
	float t_2 = floorf(h) * dX_46_v;
	float t_3 = floorf(d) * dY_46_w;
	float t_4 = floorf(d) * dX_46_w;
	float t_5 = floorf(w) * dX_46_u;
	return log2f(sqrtf(fmaxf((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(w) * dY_46_u)
	t_1 = Float32(floor(h) * dY_46_v)
	t_2 = Float32(floor(h) * dX_46_v)
	t_3 = Float32(floor(d) * dY_46_w)
	t_4 = Float32(floor(d) * dX_46_w)
	t_5 = Float32(floor(w) * dX_46_u)
	return log2(sqrt(fmax(Float32(Float32(Float32(t_5 * t_5) + Float32(t_2 * t_2)) + Float32(t_4 * t_4)), Float32(Float32(Float32(t_0 * t_0) + Float32(t_1 * t_1)) + Float32(t_3 * t_3)))))
end
function tmp = code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = floor(w) * dY_46_u;
	t_1 = floor(h) * dY_46_v;
	t_2 = floor(h) * dX_46_v;
	t_3 = floor(d) * dY_46_w;
	t_4 = floor(d) * dX_46_w;
	t_5 = floor(w) * dX_46_u;
	tmp = log2(sqrt(max((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_1 := \left\lfloor h\right\rfloor  \cdot dY.v\\
t_2 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_3 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_4 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_5 := \left\lfloor w\right\rfloor  \cdot dX.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right)
\end{array}
\end{array}

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 6 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 67.9% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_1 := \left\lfloor h\right\rfloor \cdot dY.v\\ t_2 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_3 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_4 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_5 := \left\lfloor w\right\rfloor \cdot dX.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dY.u))
        (t_1 (* (floor h) dY.v))
        (t_2 (* (floor h) dX.v))
        (t_3 (* (floor d) dY.w))
        (t_4 (* (floor d) dX.w))
        (t_5 (* (floor w) dX.u)))
   (log2
    (sqrt
     (fmax
      (+ (+ (* t_5 t_5) (* t_2 t_2)) (* t_4 t_4))
      (+ (+ (* t_0 t_0) (* t_1 t_1)) (* t_3 t_3)))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(w) * dY_46_u;
	float t_1 = floorf(h) * dY_46_v;
	float t_2 = floorf(h) * dX_46_v;
	float t_3 = floorf(d) * dY_46_w;
	float t_4 = floorf(d) * dX_46_w;
	float t_5 = floorf(w) * dX_46_u;
	return log2f(sqrtf(fmaxf((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(w) * dY_46_u)
	t_1 = Float32(floor(h) * dY_46_v)
	t_2 = Float32(floor(h) * dX_46_v)
	t_3 = Float32(floor(d) * dY_46_w)
	t_4 = Float32(floor(d) * dX_46_w)
	t_5 = Float32(floor(w) * dX_46_u)
	return log2(sqrt(fmax(Float32(Float32(Float32(t_5 * t_5) + Float32(t_2 * t_2)) + Float32(t_4 * t_4)), Float32(Float32(Float32(t_0 * t_0) + Float32(t_1 * t_1)) + Float32(t_3 * t_3)))))
end
function tmp = code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = floor(w) * dY_46_u;
	t_1 = floor(h) * dY_46_v;
	t_2 = floor(h) * dX_46_v;
	t_3 = floor(d) * dY_46_w;
	t_4 = floor(d) * dX_46_w;
	t_5 = floor(w) * dX_46_u;
	tmp = log2(sqrt(max((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_1 := \left\lfloor h\right\rfloor  \cdot dY.v\\
t_2 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_3 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_4 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_5 := \left\lfloor w\right\rfloor  \cdot dX.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right)
\end{array}
\end{array}

Alternative 1: 67.9% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_1 := \left\lfloor h\right\rfloor \cdot dY.v\\ t_2 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_3 := \left\lfloor w\right\rfloor \cdot dX.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_3 \cdot t\_3 + t\_0 \cdot t\_0\right) + t\_2 \cdot t\_2, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor , dY.u, t\_1 \cdot t\_1\right)\right)\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor h) dX.v))
        (t_1 (* (floor h) dY.v))
        (t_2 (* (floor d) dX.w))
        (t_3 (* (floor w) dX.u)))
   (log2
    (sqrt
     (fmax
      (+ (+ (* t_3 t_3) (* t_0 t_0)) (* t_2 t_2))
      (fma
       (* (* (floor d) dY.w) (floor d))
       dY.w
       (fma (* (* (floor w) dY.u) (floor w)) dY.u (* t_1 t_1))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(h) * dX_46_v;
	float t_1 = floorf(h) * dY_46_v;
	float t_2 = floorf(d) * dX_46_w;
	float t_3 = floorf(w) * dX_46_u;
	return log2f(sqrtf(fmaxf((((t_3 * t_3) + (t_0 * t_0)) + (t_2 * t_2)), fmaf(((floorf(d) * dY_46_w) * floorf(d)), dY_46_w, fmaf(((floorf(w) * dY_46_u) * floorf(w)), dY_46_u, (t_1 * t_1))))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(h) * dX_46_v)
	t_1 = Float32(floor(h) * dY_46_v)
	t_2 = Float32(floor(d) * dX_46_w)
	t_3 = Float32(floor(w) * dX_46_u)
	return log2(sqrt(fmax(Float32(Float32(Float32(t_3 * t_3) + Float32(t_0 * t_0)) + Float32(t_2 * t_2)), fma(Float32(Float32(floor(d) * dY_46_w) * floor(d)), dY_46_w, fma(Float32(Float32(floor(w) * dY_46_u) * floor(w)), dY_46_u, Float32(t_1 * t_1))))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_1 := \left\lfloor h\right\rfloor  \cdot dY.v\\
t_2 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_3 := \left\lfloor w\right\rfloor  \cdot dX.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_3 \cdot t\_3 + t\_0 \cdot t\_0\right) + t\_2 \cdot t\_2, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor  \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor w\right\rfloor  \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor , dY.u, t\_1 \cdot t\_1\right)\right)\right)}\right)
\end{array}
\end{array}
Derivation
  1. Initial program 67.9%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Applied rewrites67.9%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \color{blue}{\mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor , dY.u, \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right)\right)}\right)}\right) \]
  3. Add Preprocessing

Alternative 2: 67.9% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_1 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_2 := \left\lfloor w\right\rfloor \cdot dX.u\\ t_3 := \left\lfloor w\right\rfloor \cdot dY.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_2, t\_2, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, t\_1 \cdot t\_1\right)\right), \mathsf{fma}\left(t\_3, t\_3, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor d) dY.w))
        (t_1 (* (floor d) dX.w))
        (t_2 (* (floor w) dX.u))
        (t_3 (* (floor w) dY.u)))
   (log2
    (sqrt
     (fmax
      (fma t_2 t_2 (fma (* (* (floor h) dX.v) (floor h)) dX.v (* t_1 t_1)))
      (fma
       t_3
       t_3
       (fma (* (* (floor h) dY.v) (floor h)) dY.v (* t_0 t_0))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(d) * dY_46_w;
	float t_1 = floorf(d) * dX_46_w;
	float t_2 = floorf(w) * dX_46_u;
	float t_3 = floorf(w) * dY_46_u;
	return log2f(sqrtf(fmaxf(fmaf(t_2, t_2, fmaf(((floorf(h) * dX_46_v) * floorf(h)), dX_46_v, (t_1 * t_1))), fmaf(t_3, t_3, fmaf(((floorf(h) * dY_46_v) * floorf(h)), dY_46_v, (t_0 * t_0))))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(d) * dY_46_w)
	t_1 = Float32(floor(d) * dX_46_w)
	t_2 = Float32(floor(w) * dX_46_u)
	t_3 = Float32(floor(w) * dY_46_u)
	return log2(sqrt(fmax(fma(t_2, t_2, fma(Float32(Float32(floor(h) * dX_46_v) * floor(h)), dX_46_v, Float32(t_1 * t_1))), fma(t_3, t_3, fma(Float32(Float32(floor(h) * dY_46_v) * floor(h)), dY_46_v, Float32(t_0 * t_0))))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_1 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_2 := \left\lfloor w\right\rfloor  \cdot dX.u\\
t_3 := \left\lfloor w\right\rfloor  \cdot dY.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_2, t\_2, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, t\_1 \cdot t\_1\right)\right), \mathsf{fma}\left(t\_3, t\_3, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right)
\end{array}
\end{array}
Derivation
  1. Initial program 67.9%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Applied rewrites67.9%

    \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dX.u, \left\lfloor w\right\rfloor \cdot dX.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right)\right), \mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dY.u, \left\lfloor w\right\rfloor \cdot dY.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)\right)}\right)} \]
  3. Add Preprocessing

Alternative 3: 62.9% accurate, 1.2× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_1 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_2 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_3 := \left\lfloor w\right\rfloor \cdot dX.u\\ t_4 := \left\lfloor d\right\rfloor \cdot dY.w\\ \mathbf{if}\;dX.u \leq 30000:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot \left\lfloor h\right\rfloor , dX.v, t\_2 \cdot t\_2\right), \mathsf{fma}\left(t\_4 \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_1 \cdot t\_1\right)\right)\right)}\right)\\ \mathbf{else}:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_3, t\_3, \mathsf{fma}\left(t\_2 \cdot \left\lfloor d\right\rfloor , dX.w, t\_0 \cdot t\_0\right)\right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , t\_4 \cdot t\_4\right)\right)}\right)\\ \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor h) dX.v))
        (t_1 (* (floor w) dY.u))
        (t_2 (* (floor d) dX.w))
        (t_3 (* (floor w) dX.u))
        (t_4 (* (floor d) dY.w)))
   (if (<= dX.u 30000.0)
     (log2
      (sqrt
       (fmax
        (fma (* t_0 (floor h)) dX.v (* t_2 t_2))
        (fma
         (* t_4 (floor d))
         dY.w
         (fma (* (* (floor h) dY.v) (floor h)) dY.v (* t_1 t_1))))))
     (log2
      (sqrt
       (fmax
        (fma t_3 t_3 (fma (* t_2 (floor d)) dX.w (* t_0 t_0)))
        (fma (* dY.u dY.u) (* (floor w) (floor w)) (* t_4 t_4))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(h) * dX_46_v;
	float t_1 = floorf(w) * dY_46_u;
	float t_2 = floorf(d) * dX_46_w;
	float t_3 = floorf(w) * dX_46_u;
	float t_4 = floorf(d) * dY_46_w;
	float tmp;
	if (dX_46_u <= 30000.0f) {
		tmp = log2f(sqrtf(fmaxf(fmaf((t_0 * floorf(h)), dX_46_v, (t_2 * t_2)), fmaf((t_4 * floorf(d)), dY_46_w, fmaf(((floorf(h) * dY_46_v) * floorf(h)), dY_46_v, (t_1 * t_1))))));
	} else {
		tmp = log2f(sqrtf(fmaxf(fmaf(t_3, t_3, fmaf((t_2 * floorf(d)), dX_46_w, (t_0 * t_0))), fmaf((dY_46_u * dY_46_u), (floorf(w) * floorf(w)), (t_4 * t_4)))));
	}
	return tmp;
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(h) * dX_46_v)
	t_1 = Float32(floor(w) * dY_46_u)
	t_2 = Float32(floor(d) * dX_46_w)
	t_3 = Float32(floor(w) * dX_46_u)
	t_4 = Float32(floor(d) * dY_46_w)
	tmp = Float32(0.0)
	if (dX_46_u <= Float32(30000.0))
		tmp = log2(sqrt(fmax(fma(Float32(t_0 * floor(h)), dX_46_v, Float32(t_2 * t_2)), fma(Float32(t_4 * floor(d)), dY_46_w, fma(Float32(Float32(floor(h) * dY_46_v) * floor(h)), dY_46_v, Float32(t_1 * t_1))))));
	else
		tmp = log2(sqrt(fmax(fma(t_3, t_3, fma(Float32(t_2 * floor(d)), dX_46_w, Float32(t_0 * t_0))), fma(Float32(dY_46_u * dY_46_u), Float32(floor(w) * floor(w)), Float32(t_4 * t_4)))));
	end
	return tmp
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_1 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_2 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_3 := \left\lfloor w\right\rfloor  \cdot dX.u\\
t_4 := \left\lfloor d\right\rfloor  \cdot dY.w\\
\mathbf{if}\;dX.u \leq 30000:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot \left\lfloor h\right\rfloor , dX.v, t\_2 \cdot t\_2\right), \mathsf{fma}\left(t\_4 \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_1 \cdot t\_1\right)\right)\right)}\right)\\

\mathbf{else}:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_3, t\_3, \mathsf{fma}\left(t\_2 \cdot \left\lfloor d\right\rfloor , dX.w, t\_0 \cdot t\_0\right)\right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor  \cdot \left\lfloor w\right\rfloor , t\_4 \cdot t\_4\right)\right)}\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if dX.u < 3e4

    1. Initial program 67.9%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dX.u around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.v}^{2} \cdot {\left(\left\lfloor h\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. Applied rewrites60.4%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.v}^{2}, {\left(\left\lfloor h\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. Applied rewrites60.4%

      \[\leadsto \log_{2} \color{blue}{\left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right)\right)\right)\right)}\right)} \]

    if 3e4 < dX.u

    1. Initial program 67.9%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dY.v around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \color{blue}{{dY.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dY.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}\right)}\right) \]
    3. Applied rewrites61.0%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \color{blue}{\mathsf{fma}\left({dY.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dY.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}\right)}\right) \]
    4. Applied rewrites61.0%

      \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dX.u, \left\lfloor w\right\rfloor \cdot dX.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right)\right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)}\right)} \]
    5. Applied rewrites61.0%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dX.u, \left\lfloor w\right\rfloor \cdot dX.u, \color{blue}{\mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right)}\right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)}\right) \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 4: 62.6% accurate, 1.2× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor \\ t_1 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_2 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_3 := t\_2 \cdot t\_2\\ t_4 := \left\lfloor d\right\rfloor \cdot dY.w\\ \mathbf{if}\;dX.u \leq 13480000:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, t\_3\right), \mathsf{fma}\left(t\_4 \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(t\_0, dY.v, t\_1 \cdot t\_1\right)\right)\right)}\right)\\ \mathbf{else}:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , t\_3\right), \mathsf{fma}\left(t\_1, t\_1, \mathsf{fma}\left(t\_0, dY.v, t\_4 \cdot t\_4\right)\right)\right)}\right)\\ \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (* (floor h) dY.v) (floor h)))
        (t_1 (* (floor w) dY.u))
        (t_2 (* (floor d) dX.w))
        (t_3 (* t_2 t_2))
        (t_4 (* (floor d) dY.w)))
   (if (<= dX.u 13480000.0)
     (log2
      (sqrt
       (fmax
        (fma (* (* (floor h) dX.v) (floor h)) dX.v t_3)
        (fma (* t_4 (floor d)) dY.w (fma t_0 dY.v (* t_1 t_1))))))
     (log2
      (sqrt
       (fmax
        (fma (* dX.u dX.u) (* (floor w) (floor w)) t_3)
        (fma t_1 t_1 (fma t_0 dY.v (* t_4 t_4)))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = (floorf(h) * dY_46_v) * floorf(h);
	float t_1 = floorf(w) * dY_46_u;
	float t_2 = floorf(d) * dX_46_w;
	float t_3 = t_2 * t_2;
	float t_4 = floorf(d) * dY_46_w;
	float tmp;
	if (dX_46_u <= 13480000.0f) {
		tmp = log2f(sqrtf(fmaxf(fmaf(((floorf(h) * dX_46_v) * floorf(h)), dX_46_v, t_3), fmaf((t_4 * floorf(d)), dY_46_w, fmaf(t_0, dY_46_v, (t_1 * t_1))))));
	} else {
		tmp = log2f(sqrtf(fmaxf(fmaf((dX_46_u * dX_46_u), (floorf(w) * floorf(w)), t_3), fmaf(t_1, t_1, fmaf(t_0, dY_46_v, (t_4 * t_4))))));
	}
	return tmp;
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(Float32(floor(h) * dY_46_v) * floor(h))
	t_1 = Float32(floor(w) * dY_46_u)
	t_2 = Float32(floor(d) * dX_46_w)
	t_3 = Float32(t_2 * t_2)
	t_4 = Float32(floor(d) * dY_46_w)
	tmp = Float32(0.0)
	if (dX_46_u <= Float32(13480000.0))
		tmp = log2(sqrt(fmax(fma(Float32(Float32(floor(h) * dX_46_v) * floor(h)), dX_46_v, t_3), fma(Float32(t_4 * floor(d)), dY_46_w, fma(t_0, dY_46_v, Float32(t_1 * t_1))))));
	else
		tmp = log2(sqrt(fmax(fma(Float32(dX_46_u * dX_46_u), Float32(floor(w) * floor(w)), t_3), fma(t_1, t_1, fma(t_0, dY_46_v, Float32(t_4 * t_4))))));
	end
	return tmp
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left(\left\lfloor h\right\rfloor  \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor \\
t_1 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_2 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_3 := t\_2 \cdot t\_2\\
t_4 := \left\lfloor d\right\rfloor  \cdot dY.w\\
\mathbf{if}\;dX.u \leq 13480000:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, t\_3\right), \mathsf{fma}\left(t\_4 \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(t\_0, dY.v, t\_1 \cdot t\_1\right)\right)\right)}\right)\\

\mathbf{else}:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor  \cdot \left\lfloor w\right\rfloor , t\_3\right), \mathsf{fma}\left(t\_1, t\_1, \mathsf{fma}\left(t\_0, dY.v, t\_4 \cdot t\_4\right)\right)\right)}\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if dX.u < 1.348e7

    1. Initial program 67.9%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dX.u around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.v}^{2} \cdot {\left(\left\lfloor h\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. Applied rewrites60.4%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.v}^{2}, {\left(\left\lfloor h\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. Applied rewrites60.4%

      \[\leadsto \log_{2} \color{blue}{\left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor , dX.v, \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right)\right)\right)\right)}\right)} \]

    if 1.348e7 < dX.u

    1. Initial program 67.9%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dX.v around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. Applied rewrites60.7%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. Applied rewrites60.7%

      \[\leadsto \log_{2} \left(\sqrt{\color{blue}{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dY.u, \left\lfloor w\right\rfloor \cdot dY.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)\right)}}\right) \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 5: 60.7% accurate, 1.2× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_1 := \left\lfloor d\right\rfloor \cdot dX.w\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , t\_1 \cdot t\_1\right), \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dY.u)) (t_1 (* (floor d) dX.w)))
   (log2
    (sqrt
     (fmax
      (fma (* dX.u dX.u) (* (floor w) (floor w)) (* t_1 t_1))
      (fma
       (* (* (floor d) dY.w) (floor d))
       dY.w
       (fma (* (* (floor h) dY.v) (floor h)) dY.v (* t_0 t_0))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(w) * dY_46_u;
	float t_1 = floorf(d) * dX_46_w;
	return log2f(sqrtf(fmaxf(fmaf((dX_46_u * dX_46_u), (floorf(w) * floorf(w)), (t_1 * t_1)), fmaf(((floorf(d) * dY_46_w) * floorf(d)), dY_46_w, fmaf(((floorf(h) * dY_46_v) * floorf(h)), dY_46_v, (t_0 * t_0))))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(w) * dY_46_u)
	t_1 = Float32(floor(d) * dX_46_w)
	return log2(sqrt(fmax(fma(Float32(dX_46_u * dX_46_u), Float32(floor(w) * floor(w)), Float32(t_1 * t_1)), fma(Float32(Float32(floor(d) * dY_46_w) * floor(d)), dY_46_w, fma(Float32(Float32(floor(h) * dY_46_v) * floor(h)), dY_46_v, Float32(t_0 * t_0))))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_1 := \left\lfloor d\right\rfloor  \cdot dX.w\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor  \cdot \left\lfloor w\right\rfloor , t\_1 \cdot t\_1\right), \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor  \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right)
\end{array}
\end{array}
Derivation
  1. Initial program 67.9%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Taylor expanded in dX.v around 0

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  3. Applied rewrites60.7%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  4. Applied rewrites60.7%

    \[\leadsto \log_{2} \left(\sqrt{\color{blue}{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dY.u, \left\lfloor w\right\rfloor \cdot dY.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)\right)}}\right) \]
  5. Applied rewrites60.7%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \color{blue}{\mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left\lfloor d\right\rfloor , dY.w, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right)\right)\right)}\right)}\right) \]
  6. Add Preprocessing

Alternative 6: 60.7% accurate, 1.2× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_1 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_2 := \left\lfloor w\right\rfloor \cdot dY.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , t\_1 \cdot t\_1\right), \mathsf{fma}\left(t\_2, t\_2, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor d) dY.w))
        (t_1 (* (floor d) dX.w))
        (t_2 (* (floor w) dY.u)))
   (log2
    (sqrt
     (fmax
      (fma (* dX.u dX.u) (* (floor w) (floor w)) (* t_1 t_1))
      (fma
       t_2
       t_2
       (fma (* (* (floor h) dY.v) (floor h)) dY.v (* t_0 t_0))))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(d) * dY_46_w;
	float t_1 = floorf(d) * dX_46_w;
	float t_2 = floorf(w) * dY_46_u;
	return log2f(sqrtf(fmaxf(fmaf((dX_46_u * dX_46_u), (floorf(w) * floorf(w)), (t_1 * t_1)), fmaf(t_2, t_2, fmaf(((floorf(h) * dY_46_v) * floorf(h)), dY_46_v, (t_0 * t_0))))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(d) * dY_46_w)
	t_1 = Float32(floor(d) * dX_46_w)
	t_2 = Float32(floor(w) * dY_46_u)
	return log2(sqrt(fmax(fma(Float32(dX_46_u * dX_46_u), Float32(floor(w) * floor(w)), Float32(t_1 * t_1)), fma(t_2, t_2, fma(Float32(Float32(floor(h) * dY_46_v) * floor(h)), dY_46_v, Float32(t_0 * t_0))))))
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_1 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_2 := \left\lfloor w\right\rfloor  \cdot dY.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor  \cdot \left\lfloor w\right\rfloor , t\_1 \cdot t\_1\right), \mathsf{fma}\left(t\_2, t\_2, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor  \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, t\_0 \cdot t\_0\right)\right)\right)}\right)
\end{array}
\end{array}
Derivation
  1. Initial program 67.9%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Taylor expanded in dX.v around 0

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  3. Applied rewrites60.7%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  4. Applied rewrites60.7%

    \[\leadsto \log_{2} \left(\sqrt{\color{blue}{\mathsf{max}\left(\mathsf{fma}\left(dX.u \cdot dX.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right)\right), \mathsf{fma}\left(\left\lfloor w\right\rfloor \cdot dY.u, \left\lfloor w\right\rfloor \cdot dY.u, \mathsf{fma}\left(\left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor , dY.v, \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)\right)\right)}}\right) \]
  5. Add Preprocessing

Reproduce

?
herbie shell --seed 2025161 
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
  :name "Isotropic LOD (LOD)"
  :precision binary32
  :pre (and (and (and (and (and (and (and (and (and (<= 1.0 w) (<= w 16384.0)) (and (<= 1.0 h) (<= h 16384.0))) (and (<= 1.0 d) (<= d 4096.0))) (and (<= 1e-20 (fabs dX.u)) (<= (fabs dX.u) 1e+20))) (and (<= 1e-20 (fabs dX.v)) (<= (fabs dX.v) 1e+20))) (and (<= 1e-20 (fabs dX.w)) (<= (fabs dX.w) 1e+20))) (and (<= 1e-20 (fabs dY.u)) (<= (fabs dY.u) 1e+20))) (and (<= 1e-20 (fabs dY.v)) (<= (fabs dY.v) 1e+20))) (and (<= 1e-20 (fabs dY.w)) (<= (fabs dY.w) 1e+20)))
  (log2 (sqrt (fmax (+ (+ (* (* (floor w) dX.u) (* (floor w) dX.u)) (* (* (floor h) dX.v) (* (floor h) dX.v))) (* (* (floor d) dX.w) (* (floor d) dX.w))) (+ (+ (* (* (floor w) dY.u) (* (floor w) dY.u)) (* (* (floor h) dY.v) (* (floor h) dY.v))) (* (* (floor d) dY.w) (* (floor d) dY.w)))))))