Isotropic LOD (LOD)

Percentage Accurate: 67.6% → 71.2%
Time: 9.0s
Alternatives: 4
Speedup: 0.5×

Specification

?
\[\left(\left(\left(\left(\left(\left(\left(\left(1 \leq w \land w \leq 16384\right) \land \left(1 \leq h \land h \leq 16384\right)\right) \land \left(1 \leq d \land d \leq 4096\right)\right) \land \left(10^{-20} \leq \left|dX.u\right| \land \left|dX.u\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dX.v\right| \land \left|dX.v\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dX.w\right| \land \left|dX.w\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.u\right| \land \left|dY.u\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.v\right| \land \left|dY.v\right| \leq 10^{+20}\right)\right) \land \left(10^{-20} \leq \left|dY.w\right| \land \left|dY.w\right| \leq 10^{+20}\right)\]
\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_1 := \left\lfloor h\right\rfloor \cdot dY.v\\ t_2 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_3 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_4 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_5 := \left\lfloor w\right\rfloor \cdot dX.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dY.u))
        (t_1 (* (floor h) dY.v))
        (t_2 (* (floor h) dX.v))
        (t_3 (* (floor d) dY.w))
        (t_4 (* (floor d) dX.w))
        (t_5 (* (floor w) dX.u)))
   (log2
    (sqrt
     (fmax
      (+ (+ (* t_5 t_5) (* t_2 t_2)) (* t_4 t_4))
      (+ (+ (* t_0 t_0) (* t_1 t_1)) (* t_3 t_3)))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(w) * dY_46_u;
	float t_1 = floorf(h) * dY_46_v;
	float t_2 = floorf(h) * dX_46_v;
	float t_3 = floorf(d) * dY_46_w;
	float t_4 = floorf(d) * dX_46_w;
	float t_5 = floorf(w) * dX_46_u;
	return log2f(sqrtf(fmaxf((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(w) * dY_46_u)
	t_1 = Float32(floor(h) * dY_46_v)
	t_2 = Float32(floor(h) * dX_46_v)
	t_3 = Float32(floor(d) * dY_46_w)
	t_4 = Float32(floor(d) * dX_46_w)
	t_5 = Float32(floor(w) * dX_46_u)
	return log2(sqrt(fmax(Float32(Float32(Float32(t_5 * t_5) + Float32(t_2 * t_2)) + Float32(t_4 * t_4)), Float32(Float32(Float32(t_0 * t_0) + Float32(t_1 * t_1)) + Float32(t_3 * t_3)))))
end
function tmp = code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = floor(w) * dY_46_u;
	t_1 = floor(h) * dY_46_v;
	t_2 = floor(h) * dX_46_v;
	t_3 = floor(d) * dY_46_w;
	t_4 = floor(d) * dX_46_w;
	t_5 = floor(w) * dX_46_u;
	tmp = log2(sqrt(max((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_1 := \left\lfloor h\right\rfloor  \cdot dY.v\\
t_2 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_3 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_4 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_5 := \left\lfloor w\right\rfloor  \cdot dX.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right)
\end{array}
\end{array}

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 4 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 67.6% accurate, 1.0× speedup?

\[\begin{array}{l} \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_1 := \left\lfloor h\right\rfloor \cdot dY.v\\ t_2 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_3 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_4 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_5 := \left\lfloor w\right\rfloor \cdot dX.u\\ \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right) \end{array} \end{array} \]
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dY.u))
        (t_1 (* (floor h) dY.v))
        (t_2 (* (floor h) dX.v))
        (t_3 (* (floor d) dY.w))
        (t_4 (* (floor d) dX.w))
        (t_5 (* (floor w) dX.u)))
   (log2
    (sqrt
     (fmax
      (+ (+ (* t_5 t_5) (* t_2 t_2)) (* t_4 t_4))
      (+ (+ (* t_0 t_0) (* t_1 t_1)) (* t_3 t_3)))))))
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v, float dY_46_w) {
	float t_0 = floorf(w) * dY_46_u;
	float t_1 = floorf(h) * dY_46_v;
	float t_2 = floorf(h) * dX_46_v;
	float t_3 = floorf(d) * dY_46_w;
	float t_4 = floorf(d) * dX_46_w;
	float t_5 = floorf(w) * dX_46_u;
	return log2f(sqrtf(fmaxf((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
}
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = Float32(floor(w) * dY_46_u)
	t_1 = Float32(floor(h) * dY_46_v)
	t_2 = Float32(floor(h) * dX_46_v)
	t_3 = Float32(floor(d) * dY_46_w)
	t_4 = Float32(floor(d) * dX_46_w)
	t_5 = Float32(floor(w) * dX_46_u)
	return log2(sqrt(fmax(Float32(Float32(Float32(t_5 * t_5) + Float32(t_2 * t_2)) + Float32(t_4 * t_4)), Float32(Float32(Float32(t_0 * t_0) + Float32(t_1 * t_1)) + Float32(t_3 * t_3)))))
end
function tmp = code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v, dY_46_w)
	t_0 = floor(w) * dY_46_u;
	t_1 = floor(h) * dY_46_v;
	t_2 = floor(h) * dX_46_v;
	t_3 = floor(d) * dY_46_w;
	t_4 = floor(d) * dX_46_w;
	t_5 = floor(w) * dX_46_u;
	tmp = log2(sqrt(max((((t_5 * t_5) + (t_2 * t_2)) + (t_4 * t_4)), (((t_0 * t_0) + (t_1 * t_1)) + (t_3 * t_3)))));
end
\begin{array}{l}

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_1 := \left\lfloor h\right\rfloor  \cdot dY.v\\
t_2 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_3 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_4 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_5 := \left\lfloor w\right\rfloor  \cdot dX.u\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_5 \cdot t\_5 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4, \left(t\_0 \cdot t\_0 + t\_1 \cdot t\_1\right) + t\_3 \cdot t\_3\right)}\right)
\end{array}
\end{array}

Alternative 1: 71.2% accurate, 0.5× speedup?

\[\begin{array}{l} dY.v_m = \left|dY.v\right| \\ \begin{array}{l} t_0 := \left\lfloor w\right\rfloor \cdot dX.u\\ t_1 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_2 := \left\lfloor h\right\rfloor \cdot dY.v\_m\\ t_3 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_4 := \sqrt{-dY.v\_m}\\ t_5 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_6 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_7 := \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_0 \cdot t\_0 + t\_3 \cdot t\_3\right) + t\_6 \cdot t\_6, \left(t\_1 \cdot t\_1 + t\_2 \cdot t\_2\right) + t\_5 \cdot t\_5\right)}\right)\\ \mathbf{if}\;t\_7 \leq 100:\\ \;\;\;\;t\_7\\ \mathbf{else}:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(t\_4 \cdot t\_4\right) \cdot \left(dY.v\_m \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right)\\ \end{array} \end{array} \]
dY.v_m = (fabs.f32 dY.v)
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v_m dY.w)
 :precision binary32
 (let* ((t_0 (* (floor w) dX.u))
        (t_1 (* (floor w) dY.u))
        (t_2 (* (floor h) dY.v_m))
        (t_3 (* (floor h) dX.v))
        (t_4 (sqrt (- dY.v_m)))
        (t_5 (* (floor d) dY.w))
        (t_6 (* (floor d) dX.w))
        (t_7
         (log2
          (sqrt
           (fmax
            (+ (+ (* t_0 t_0) (* t_3 t_3)) (* t_6 t_6))
            (+ (+ (* t_1 t_1) (* t_2 t_2)) (* t_5 t_5)))))))
   (if (<= t_7 100.0)
     t_7
     (log2
      (sqrt
       (fmax
        (fma
         (* (* dX.w (floor d)) (floor d))
         dX.w
         (* (* (* dX.u (floor w)) dX.u) (floor w)))
        (fma
         (* (* t_4 t_4) (* dY.v_m (floor h)))
         (fabs (floor h))
         (fma
          (* (* (floor d) (floor d)) dY.w)
          dY.w
          (* (* (* dY.u (floor w)) dY.u) (floor w))))))))))
dY.v_m = fabs(dY_46_v);
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v_m, float dY_46_w) {
	float t_0 = floorf(w) * dX_46_u;
	float t_1 = floorf(w) * dY_46_u;
	float t_2 = floorf(h) * dY_46_v_m;
	float t_3 = floorf(h) * dX_46_v;
	float t_4 = sqrtf(-dY_46_v_m);
	float t_5 = floorf(d) * dY_46_w;
	float t_6 = floorf(d) * dX_46_w;
	float t_7 = log2f(sqrtf(fmaxf((((t_0 * t_0) + (t_3 * t_3)) + (t_6 * t_6)), (((t_1 * t_1) + (t_2 * t_2)) + (t_5 * t_5)))));
	float tmp;
	if (t_7 <= 100.0f) {
		tmp = t_7;
	} else {
		tmp = log2f(sqrtf(fmaxf(fmaf(((dX_46_w * floorf(d)) * floorf(d)), dX_46_w, (((dX_46_u * floorf(w)) * dX_46_u) * floorf(w))), fmaf(((t_4 * t_4) * (dY_46_v_m * floorf(h))), fabsf(floorf(h)), fmaf(((floorf(d) * floorf(d)) * dY_46_w), dY_46_w, (((dY_46_u * floorf(w)) * dY_46_u) * floorf(w)))))));
	}
	return tmp;
}
dY.v_m = abs(dY_46_v)
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v_m, dY_46_w)
	t_0 = Float32(floor(w) * dX_46_u)
	t_1 = Float32(floor(w) * dY_46_u)
	t_2 = Float32(floor(h) * dY_46_v_m)
	t_3 = Float32(floor(h) * dX_46_v)
	t_4 = sqrt(Float32(-dY_46_v_m))
	t_5 = Float32(floor(d) * dY_46_w)
	t_6 = Float32(floor(d) * dX_46_w)
	t_7 = log2(sqrt(fmax(Float32(Float32(Float32(t_0 * t_0) + Float32(t_3 * t_3)) + Float32(t_6 * t_6)), Float32(Float32(Float32(t_1 * t_1) + Float32(t_2 * t_2)) + Float32(t_5 * t_5)))))
	tmp = Float32(0.0)
	if (t_7 <= Float32(100.0))
		tmp = t_7;
	else
		tmp = log2(sqrt(fmax(fma(Float32(Float32(dX_46_w * floor(d)) * floor(d)), dX_46_w, Float32(Float32(Float32(dX_46_u * floor(w)) * dX_46_u) * floor(w))), fma(Float32(Float32(t_4 * t_4) * Float32(dY_46_v_m * floor(h))), abs(floor(h)), fma(Float32(Float32(floor(d) * floor(d)) * dY_46_w), dY_46_w, Float32(Float32(Float32(dY_46_u * floor(w)) * dY_46_u) * floor(w)))))));
	end
	return tmp
end
\begin{array}{l}
dY.v_m = \left|dY.v\right|

\\
\begin{array}{l}
t_0 := \left\lfloor w\right\rfloor  \cdot dX.u\\
t_1 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_2 := \left\lfloor h\right\rfloor  \cdot dY.v\_m\\
t_3 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_4 := \sqrt{-dY.v\_m}\\
t_5 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_6 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_7 := \log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_0 \cdot t\_0 + t\_3 \cdot t\_3\right) + t\_6 \cdot t\_6, \left(t\_1 \cdot t\_1 + t\_2 \cdot t\_2\right) + t\_5 \cdot t\_5\right)}\right)\\
\mathbf{if}\;t\_7 \leq 100:\\
\;\;\;\;t\_7\\

\mathbf{else}:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(t\_4 \cdot t\_4\right) \cdot \left(dY.v\_m \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor  \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (log2.f32 (sqrt.f32 (fmax.f32 (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dX.u) (*.f32 (floor.f32 w) dX.u)) (*.f32 (*.f32 (floor.f32 h) dX.v) (*.f32 (floor.f32 h) dX.v))) (*.f32 (*.f32 (floor.f32 d) dX.w) (*.f32 (floor.f32 d) dX.w))) (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dY.u) (*.f32 (floor.f32 w) dY.u)) (*.f32 (*.f32 (floor.f32 h) dY.v) (*.f32 (floor.f32 h) dY.v))) (*.f32 (*.f32 (floor.f32 d) dY.w) (*.f32 (floor.f32 d) dY.w)))))) < 100

    1. Initial program 67.6%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]

    if 100 < (log2.f32 (sqrt.f32 (fmax.f32 (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dX.u) (*.f32 (floor.f32 w) dX.u)) (*.f32 (*.f32 (floor.f32 h) dX.v) (*.f32 (floor.f32 h) dX.v))) (*.f32 (*.f32 (floor.f32 d) dX.w) (*.f32 (floor.f32 d) dX.w))) (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dY.u) (*.f32 (floor.f32 w) dY.u)) (*.f32 (*.f32 (floor.f32 h) dY.v) (*.f32 (floor.f32 h) dY.v))) (*.f32 (*.f32 (floor.f32 d) dY.w) (*.f32 (floor.f32 d) dY.w))))))

    1. Initial program 67.6%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dX.v around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. Step-by-step derivation
      1. lower-fma.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, \color{blue}{{\left(\left\lfloor w\right\rfloor \right)}^{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      2. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\color{blue}{\left(\left\lfloor w\right\rfloor \right)}}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      3. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{\color{blue}{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      4. lower-floor.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      5. lower-*.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      6. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      7. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      8. lower-floor.f3260.8

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. Applied rewrites60.8%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    5. Applied rewrites60.8%

      \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(dY.v \cdot \left\lfloor h\right\rfloor , dY.v \cdot \left\lfloor h\right\rfloor , \left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left(dY.w \cdot \left\lfloor d\right\rfloor \right)\right)\right)\right)}\right)} \]
    6. Applied rewrites60.8%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \color{blue}{\mathsf{fma}\left(\left|dY.v\right| \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)}\right)}\right) \]
    7. Step-by-step derivation
      1. lift-fabs.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left|dY.v\right|} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      2. rem-sqrt-square-revN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\sqrt{dY.v \cdot dY.v}} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      3. sqr-neg-revN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\sqrt{\color{blue}{\left(\mathsf{neg}\left(dY.v\right)\right) \cdot \left(\mathsf{neg}\left(dY.v\right)\right)}} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      4. sqrt-prodN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{\mathsf{neg}\left(dY.v\right)} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      5. lower-unsound-*.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{\mathsf{neg}\left(dY.v\right)} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      6. lower-unsound-sqrt.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\color{blue}{\sqrt{\mathsf{neg}\left(dY.v\right)}} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      7. lower-neg.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{\color{blue}{-dY.v}} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      8. lower-unsound-sqrt.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{-dY.v} \cdot \color{blue}{\sqrt{\mathsf{neg}\left(dY.v\right)}}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      9. lower-neg.f3236.1

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{-dY.v} \cdot \sqrt{\color{blue}{-dY.v}}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
    8. Applied rewrites36.1%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{-dY.v} \cdot \sqrt{-dY.v}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 2: 71.2% accurate, 0.5× speedup?

\[\begin{array}{l} dY.v_m = \left|dY.v\right| \\ \begin{array}{l} t_0 := dX.w \cdot \left\lfloor d\right\rfloor \\ t_1 := \left\lfloor w\right\rfloor \cdot dX.u\\ t_2 := \left\lfloor h\right\rfloor \cdot dY.v\_m\\ t_3 := \left\lfloor h\right\rfloor \cdot dX.v\\ t_4 := \left\lfloor d\right\rfloor \cdot dY.w\\ t_5 := \sqrt{-dY.v\_m}\\ t_6 := dY.v\_m \cdot \left\lfloor h\right\rfloor \\ t_7 := \left\lfloor w\right\rfloor \cdot dY.u\\ t_8 := \left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\\ t_9 := \left\lfloor d\right\rfloor \cdot dX.w\\ t_10 := \left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\\ \mathbf{if}\;\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_1 \cdot t\_1 + t\_3 \cdot t\_3\right) + t\_9 \cdot t\_9, \left(t\_7 \cdot t\_7 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4\right)}\right) \leq 100:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot dX.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(t\_8, \left\lfloor w\right\rfloor , \left(\left(dX.v \cdot \left\lfloor h\right\rfloor \right) \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor \right)\right), \mathsf{fma}\left(\left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(t\_10, \left\lfloor w\right\rfloor , \left(t\_6 \cdot dY.v\_m\right) \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right)\\ \mathbf{else}:\\ \;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot \left\lfloor d\right\rfloor , dX.w, t\_8 \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(t\_5 \cdot t\_5\right) \cdot t\_6, \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, t\_10 \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right)\\ \end{array} \end{array} \]
dY.v_m = (fabs.f32 dY.v)
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v_m dY.w)
 :precision binary32
 (let* ((t_0 (* dX.w (floor d)))
        (t_1 (* (floor w) dX.u))
        (t_2 (* (floor h) dY.v_m))
        (t_3 (* (floor h) dX.v))
        (t_4 (* (floor d) dY.w))
        (t_5 (sqrt (- dY.v_m)))
        (t_6 (* dY.v_m (floor h)))
        (t_7 (* (floor w) dY.u))
        (t_8 (* (* dX.u (floor w)) dX.u))
        (t_9 (* (floor d) dX.w))
        (t_10 (* (* dY.u (floor w)) dY.u)))
   (if (<=
        (log2
         (sqrt
          (fmax
           (+ (+ (* t_1 t_1) (* t_3 t_3)) (* t_9 t_9))
           (+ (+ (* t_7 t_7) (* t_2 t_2)) (* t_4 t_4)))))
        100.0)
     (log2
      (sqrt
       (fmax
        (fma
         (* t_0 dX.w)
         (floor d)
         (fma t_8 (floor w) (* (* (* dX.v (floor h)) dX.v) (floor h))))
        (fma
         (* (* dY.w (floor d)) dY.w)
         (floor d)
         (fma t_10 (floor w) (* (* t_6 dY.v_m) (floor h)))))))
     (log2
      (sqrt
       (fmax
        (fma (* t_0 (floor d)) dX.w (* t_8 (floor w)))
        (fma
         (* (* t_5 t_5) t_6)
         (fabs (floor h))
         (fma (* (* (floor d) (floor d)) dY.w) dY.w (* t_10 (floor w))))))))))
dY.v_m = fabs(dY_46_v);
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v_m, float dY_46_w) {
	float t_0 = dX_46_w * floorf(d);
	float t_1 = floorf(w) * dX_46_u;
	float t_2 = floorf(h) * dY_46_v_m;
	float t_3 = floorf(h) * dX_46_v;
	float t_4 = floorf(d) * dY_46_w;
	float t_5 = sqrtf(-dY_46_v_m);
	float t_6 = dY_46_v_m * floorf(h);
	float t_7 = floorf(w) * dY_46_u;
	float t_8 = (dX_46_u * floorf(w)) * dX_46_u;
	float t_9 = floorf(d) * dX_46_w;
	float t_10 = (dY_46_u * floorf(w)) * dY_46_u;
	float tmp;
	if (log2f(sqrtf(fmaxf((((t_1 * t_1) + (t_3 * t_3)) + (t_9 * t_9)), (((t_7 * t_7) + (t_2 * t_2)) + (t_4 * t_4))))) <= 100.0f) {
		tmp = log2f(sqrtf(fmaxf(fmaf((t_0 * dX_46_w), floorf(d), fmaf(t_8, floorf(w), (((dX_46_v * floorf(h)) * dX_46_v) * floorf(h)))), fmaf(((dY_46_w * floorf(d)) * dY_46_w), floorf(d), fmaf(t_10, floorf(w), ((t_6 * dY_46_v_m) * floorf(h)))))));
	} else {
		tmp = log2f(sqrtf(fmaxf(fmaf((t_0 * floorf(d)), dX_46_w, (t_8 * floorf(w))), fmaf(((t_5 * t_5) * t_6), fabsf(floorf(h)), fmaf(((floorf(d) * floorf(d)) * dY_46_w), dY_46_w, (t_10 * floorf(w)))))));
	}
	return tmp;
}
dY.v_m = abs(dY_46_v)
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v_m, dY_46_w)
	t_0 = Float32(dX_46_w * floor(d))
	t_1 = Float32(floor(w) * dX_46_u)
	t_2 = Float32(floor(h) * dY_46_v_m)
	t_3 = Float32(floor(h) * dX_46_v)
	t_4 = Float32(floor(d) * dY_46_w)
	t_5 = sqrt(Float32(-dY_46_v_m))
	t_6 = Float32(dY_46_v_m * floor(h))
	t_7 = Float32(floor(w) * dY_46_u)
	t_8 = Float32(Float32(dX_46_u * floor(w)) * dX_46_u)
	t_9 = Float32(floor(d) * dX_46_w)
	t_10 = Float32(Float32(dY_46_u * floor(w)) * dY_46_u)
	tmp = Float32(0.0)
	if (log2(sqrt(fmax(Float32(Float32(Float32(t_1 * t_1) + Float32(t_3 * t_3)) + Float32(t_9 * t_9)), Float32(Float32(Float32(t_7 * t_7) + Float32(t_2 * t_2)) + Float32(t_4 * t_4))))) <= Float32(100.0))
		tmp = log2(sqrt(fmax(fma(Float32(t_0 * dX_46_w), floor(d), fma(t_8, floor(w), Float32(Float32(Float32(dX_46_v * floor(h)) * dX_46_v) * floor(h)))), fma(Float32(Float32(dY_46_w * floor(d)) * dY_46_w), floor(d), fma(t_10, floor(w), Float32(Float32(t_6 * dY_46_v_m) * floor(h)))))));
	else
		tmp = log2(sqrt(fmax(fma(Float32(t_0 * floor(d)), dX_46_w, Float32(t_8 * floor(w))), fma(Float32(Float32(t_5 * t_5) * t_6), abs(floor(h)), fma(Float32(Float32(floor(d) * floor(d)) * dY_46_w), dY_46_w, Float32(t_10 * floor(w)))))));
	end
	return tmp
end
\begin{array}{l}
dY.v_m = \left|dY.v\right|

\\
\begin{array}{l}
t_0 := dX.w \cdot \left\lfloor d\right\rfloor \\
t_1 := \left\lfloor w\right\rfloor  \cdot dX.u\\
t_2 := \left\lfloor h\right\rfloor  \cdot dY.v\_m\\
t_3 := \left\lfloor h\right\rfloor  \cdot dX.v\\
t_4 := \left\lfloor d\right\rfloor  \cdot dY.w\\
t_5 := \sqrt{-dY.v\_m}\\
t_6 := dY.v\_m \cdot \left\lfloor h\right\rfloor \\
t_7 := \left\lfloor w\right\rfloor  \cdot dY.u\\
t_8 := \left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\\
t_9 := \left\lfloor d\right\rfloor  \cdot dX.w\\
t_10 := \left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\\
\mathbf{if}\;\log_{2} \left(\sqrt{\mathsf{max}\left(\left(t\_1 \cdot t\_1 + t\_3 \cdot t\_3\right) + t\_9 \cdot t\_9, \left(t\_7 \cdot t\_7 + t\_2 \cdot t\_2\right) + t\_4 \cdot t\_4\right)}\right) \leq 100:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot dX.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(t\_8, \left\lfloor w\right\rfloor , \left(\left(dX.v \cdot \left\lfloor h\right\rfloor \right) \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor \right)\right), \mathsf{fma}\left(\left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(t\_10, \left\lfloor w\right\rfloor , \left(t\_6 \cdot dY.v\_m\right) \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right)\\

\mathbf{else}:\\
\;\;\;\;\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(t\_0 \cdot \left\lfloor d\right\rfloor , dX.w, t\_8 \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(t\_5 \cdot t\_5\right) \cdot t\_6, \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor  \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, t\_10 \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right)\\


\end{array}
\end{array}
Derivation
  1. Split input into 2 regimes
  2. if (log2.f32 (sqrt.f32 (fmax.f32 (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dX.u) (*.f32 (floor.f32 w) dX.u)) (*.f32 (*.f32 (floor.f32 h) dX.v) (*.f32 (floor.f32 h) dX.v))) (*.f32 (*.f32 (floor.f32 d) dX.w) (*.f32 (floor.f32 d) dX.w))) (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dY.u) (*.f32 (floor.f32 w) dY.u)) (*.f32 (*.f32 (floor.f32 h) dY.v) (*.f32 (floor.f32 h) dY.v))) (*.f32 (*.f32 (floor.f32 d) dY.w) (*.f32 (floor.f32 d) dY.w)))))) < 100

    1. Initial program 67.6%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Applied rewrites67.6%

      \[\leadsto \log_{2} \left(\sqrt{\color{blue}{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot dX.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u, \left\lfloor w\right\rfloor , \left(\left(dX.v \cdot \left\lfloor h\right\rfloor \right) \cdot dX.v\right) \cdot \left\lfloor h\right\rfloor \right)\right), \mathsf{fma}\left(\left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, \left\lfloor d\right\rfloor , \mathsf{fma}\left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u, \left\lfloor w\right\rfloor , \left(\left(dY.v \cdot \left\lfloor h\right\rfloor \right) \cdot dY.v\right) \cdot \left\lfloor h\right\rfloor \right)\right)\right)}}\right) \]

    if 100 < (log2.f32 (sqrt.f32 (fmax.f32 (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dX.u) (*.f32 (floor.f32 w) dX.u)) (*.f32 (*.f32 (floor.f32 h) dX.v) (*.f32 (floor.f32 h) dX.v))) (*.f32 (*.f32 (floor.f32 d) dX.w) (*.f32 (floor.f32 d) dX.w))) (+.f32 (+.f32 (*.f32 (*.f32 (floor.f32 w) dY.u) (*.f32 (floor.f32 w) dY.u)) (*.f32 (*.f32 (floor.f32 h) dY.v) (*.f32 (floor.f32 h) dY.v))) (*.f32 (*.f32 (floor.f32 d) dY.w) (*.f32 (floor.f32 d) dY.w))))))

    1. Initial program 67.6%

      \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. Taylor expanded in dX.v around 0

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. Step-by-step derivation
      1. lower-fma.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, \color{blue}{{\left(\left\lfloor w\right\rfloor \right)}^{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      2. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\color{blue}{\left(\left\lfloor w\right\rfloor \right)}}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      3. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{\color{blue}{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      4. lower-floor.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      5. lower-*.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      6. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      7. lower-pow.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
      8. lower-floor.f3260.8

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. Applied rewrites60.8%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    5. Applied rewrites60.8%

      \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(dY.v \cdot \left\lfloor h\right\rfloor , dY.v \cdot \left\lfloor h\right\rfloor , \left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left(dY.w \cdot \left\lfloor d\right\rfloor \right)\right)\right)\right)}\right)} \]
    6. Applied rewrites60.8%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \color{blue}{\mathsf{fma}\left(\left|dY.v\right| \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)}\right)}\right) \]
    7. Step-by-step derivation
      1. lift-fabs.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left|dY.v\right|} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      2. rem-sqrt-square-revN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\sqrt{dY.v \cdot dY.v}} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      3. sqr-neg-revN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\sqrt{\color{blue}{\left(\mathsf{neg}\left(dY.v\right)\right) \cdot \left(\mathsf{neg}\left(dY.v\right)\right)}} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      4. sqrt-prodN/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{\mathsf{neg}\left(dY.v\right)} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      5. lower-unsound-*.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{\mathsf{neg}\left(dY.v\right)} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      6. lower-unsound-sqrt.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\color{blue}{\sqrt{\mathsf{neg}\left(dY.v\right)}} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      7. lower-neg.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{\color{blue}{-dY.v}} \cdot \sqrt{\mathsf{neg}\left(dY.v\right)}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      8. lower-unsound-sqrt.f32N/A

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{-dY.v} \cdot \color{blue}{\sqrt{\mathsf{neg}\left(dY.v\right)}}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
      9. lower-neg.f3236.1

        \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\left(\sqrt{-dY.v} \cdot \sqrt{\color{blue}{-dY.v}}\right) \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
    8. Applied rewrites36.1%

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(\color{blue}{\left(\sqrt{-dY.v} \cdot \sqrt{-dY.v}\right)} \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)\right)}\right) \]
  3. Recombined 2 regimes into one program.
  4. Add Preprocessing

Alternative 3: 60.8% accurate, 1.2× speedup?

\[\begin{array}{l} dY.v_m = \left|dY.v\right| \\ \begin{array}{l} t_0 := dY.w \cdot \left\lfloor d\right\rfloor \\ t_1 := dY.v\_m \cdot \left\lfloor h\right\rfloor \\ \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(t\_1, t\_1, t\_0 \cdot t\_0\right)\right)\right)}\right) \end{array} \end{array} \]
dY.v_m = (fabs.f32 dY.v)
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v_m dY.w)
 :precision binary32
 (let* ((t_0 (* dY.w (floor d))) (t_1 (* dY.v_m (floor h))))
   (log2
    (sqrt
     (fmax
      (fma
       (* (* dX.w (floor d)) (floor d))
       dX.w
       (* (* (* dX.u (floor w)) dX.u) (floor w)))
      (fma
       (* dY.u dY.u)
       (* (floor w) (floor w))
       (fma t_1 t_1 (* t_0 t_0))))))))
dY.v_m = fabs(dY_46_v);
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v_m, float dY_46_w) {
	float t_0 = dY_46_w * floorf(d);
	float t_1 = dY_46_v_m * floorf(h);
	return log2f(sqrtf(fmaxf(fmaf(((dX_46_w * floorf(d)) * floorf(d)), dX_46_w, (((dX_46_u * floorf(w)) * dX_46_u) * floorf(w))), fmaf((dY_46_u * dY_46_u), (floorf(w) * floorf(w)), fmaf(t_1, t_1, (t_0 * t_0))))));
}
dY.v_m = abs(dY_46_v)
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v_m, dY_46_w)
	t_0 = Float32(dY_46_w * floor(d))
	t_1 = Float32(dY_46_v_m * floor(h))
	return log2(sqrt(fmax(fma(Float32(Float32(dX_46_w * floor(d)) * floor(d)), dX_46_w, Float32(Float32(Float32(dX_46_u * floor(w)) * dX_46_u) * floor(w))), fma(Float32(dY_46_u * dY_46_u), Float32(floor(w) * floor(w)), fma(t_1, t_1, Float32(t_0 * t_0))))))
end
\begin{array}{l}
dY.v_m = \left|dY.v\right|

\\
\begin{array}{l}
t_0 := dY.w \cdot \left\lfloor d\right\rfloor \\
t_1 := dY.v\_m \cdot \left\lfloor h\right\rfloor \\
\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor  \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(t\_1, t\_1, t\_0 \cdot t\_0\right)\right)\right)}\right)
\end{array}
\end{array}
Derivation
  1. Initial program 67.6%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Taylor expanded in dX.v around 0

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  3. Step-by-step derivation
    1. lower-fma.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, \color{blue}{{\left(\left\lfloor w\right\rfloor \right)}^{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\color{blue}{\left(\left\lfloor w\right\rfloor \right)}}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{\color{blue}{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. lower-floor.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    5. lower-*.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    6. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    7. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    8. lower-floor.f3260.8

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  4. Applied rewrites60.8%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  5. Applied rewrites60.8%

    \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(dY.v \cdot \left\lfloor h\right\rfloor , dY.v \cdot \left\lfloor h\right\rfloor , \left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left(dY.w \cdot \left\lfloor d\right\rfloor \right)\right)\right)\right)}\right)} \]
  6. Add Preprocessing

Alternative 4: 45.3% accurate, 1.8× speedup?

\[\begin{array}{l} dY.v_m = \left|dY.v\right| \\ \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v\_m \cdot \left(\left|dY.v\_m\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right) \end{array} \]
dY.v_m = (fabs.f32 dY.v)
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v_m dY.w)
 :precision binary32
 (log2
  (sqrt
   (fmax
    (fma
     (* (* dX.w (floor d)) (floor d))
     dX.w
     (* (* (* dX.u (floor w)) dX.u) (floor w)))
    (* dY.v_m (* (fabs dY.v_m) (* (fabs (floor h)) (floor h))))))))
dY.v_m = fabs(dY_46_v);
float code(float w, float h, float d, float dX_46_u, float dX_46_v, float dX_46_w, float dY_46_u, float dY_46_v_m, float dY_46_w) {
	return log2f(sqrtf(fmaxf(fmaf(((dX_46_w * floorf(d)) * floorf(d)), dX_46_w, (((dX_46_u * floorf(w)) * dX_46_u) * floorf(w))), (dY_46_v_m * (fabsf(dY_46_v_m) * (fabsf(floorf(h)) * floorf(h)))))));
}
dY.v_m = abs(dY_46_v)
function code(w, h, d, dX_46_u, dX_46_v, dX_46_w, dY_46_u, dY_46_v_m, dY_46_w)
	return log2(sqrt(fmax(fma(Float32(Float32(dX_46_w * floor(d)) * floor(d)), dX_46_w, Float32(Float32(Float32(dX_46_u * floor(w)) * dX_46_u) * floor(w))), Float32(dY_46_v_m * Float32(abs(dY_46_v_m) * Float32(abs(floor(h)) * floor(h)))))))
end
\begin{array}{l}
dY.v_m = \left|dY.v\right|

\\
\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v\_m \cdot \left(\left|dY.v\_m\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right)
\end{array}
Derivation
  1. Initial program 67.6%

    \[\log_{2} \left(\sqrt{\mathsf{max}\left(\left(\left(\left\lfloor w\right\rfloor \cdot dX.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dX.u\right) + \left(\left\lfloor h\right\rfloor \cdot dX.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dX.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dX.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dX.w\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  2. Taylor expanded in dX.v around 0

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{{dX.u}^{2} \cdot {\left(\left\lfloor w\right\rfloor \right)}^{2} + {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  3. Step-by-step derivation
    1. lower-fma.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, \color{blue}{{\left(\left\lfloor w\right\rfloor \right)}^{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    2. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\color{blue}{\left(\left\lfloor w\right\rfloor \right)}}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    3. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{\color{blue}{2}}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    4. lower-floor.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    5. lower-*.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    6. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    7. lower-pow.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
    8. lower-floor.f3260.8

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right), \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  4. Applied rewrites60.8%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\color{blue}{\mathsf{fma}\left({dX.u}^{2}, {\left(\left\lfloor w\right\rfloor \right)}^{2}, {dX.w}^{2} \cdot {\left(\left\lfloor d\right\rfloor \right)}^{2}\right)}, \left(\left(\left\lfloor w\right\rfloor \cdot dY.u\right) \cdot \left(\left\lfloor w\right\rfloor \cdot dY.u\right) + \left(\left\lfloor h\right\rfloor \cdot dY.v\right) \cdot \left(\left\lfloor h\right\rfloor \cdot dY.v\right)\right) + \left(\left\lfloor d\right\rfloor \cdot dY.w\right) \cdot \left(\left\lfloor d\right\rfloor \cdot dY.w\right)\right)}\right) \]
  5. Applied rewrites60.8%

    \[\leadsto \color{blue}{\log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \mathsf{fma}\left(dY.u \cdot dY.u, \left\lfloor w\right\rfloor \cdot \left\lfloor w\right\rfloor , \mathsf{fma}\left(dY.v \cdot \left\lfloor h\right\rfloor , dY.v \cdot \left\lfloor h\right\rfloor , \left(dY.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left(dY.w \cdot \left\lfloor d\right\rfloor \right)\right)\right)\right)}\right)} \]
  6. Applied rewrites60.8%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \color{blue}{\mathsf{fma}\left(\left|dY.v\right| \cdot \left(dY.v \cdot \left\lfloor h\right\rfloor \right), \left|\left\lfloor h\right\rfloor \right|, \mathsf{fma}\left(\left(\left\lfloor d\right\rfloor \cdot \left\lfloor d\right\rfloor \right) \cdot dY.w, dY.w, \left(\left(dY.u \cdot \left\lfloor w\right\rfloor \right) \cdot dY.u\right) \cdot \left\lfloor w\right\rfloor \right)\right)}\right)}\right) \]
  7. Taylor expanded in dY.v around inf

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \color{blue}{dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)}\right)}\right) \]
  8. Step-by-step derivation
    1. lower-*.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \color{blue}{\left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)}\right)}\right) \]
    2. lower-*.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \color{blue}{\left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)}\right)\right)}\right) \]
    3. lower-fabs.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \left(\color{blue}{\left|\left\lfloor h\right\rfloor \right|} \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right) \]
    4. lower-*.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \color{blue}{\left\lfloor h\right\rfloor }\right)\right)\right)}\right) \]
    5. lower-fabs.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor \color{blue}{h}\right\rfloor \right)\right)\right)}\right) \]
    6. lower-floor.f32N/A

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right) \]
    7. lower-floor.f3245.3

      \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)\right)}\right) \]
  9. Applied rewrites45.3%

    \[\leadsto \log_{2} \left(\sqrt{\mathsf{max}\left(\mathsf{fma}\left(\left(dX.w \cdot \left\lfloor d\right\rfloor \right) \cdot \left\lfloor d\right\rfloor , dX.w, \left(\left(dX.u \cdot \left\lfloor w\right\rfloor \right) \cdot dX.u\right) \cdot \left\lfloor w\right\rfloor \right), \color{blue}{dY.v \cdot \left(\left|dY.v\right| \cdot \left(\left|\left\lfloor h\right\rfloor \right| \cdot \left\lfloor h\right\rfloor \right)\right)}\right)}\right) \]
  10. Add Preprocessing

Reproduce

?
herbie shell --seed 2025159 
(FPCore (w h d dX.u dX.v dX.w dY.u dY.v dY.w)
  :name "Isotropic LOD (LOD)"
  :precision binary32
  :pre (and (and (and (and (and (and (and (and (and (<= 1.0 w) (<= w 16384.0)) (and (<= 1.0 h) (<= h 16384.0))) (and (<= 1.0 d) (<= d 4096.0))) (and (<= 1e-20 (fabs dX.u)) (<= (fabs dX.u) 1e+20))) (and (<= 1e-20 (fabs dX.v)) (<= (fabs dX.v) 1e+20))) (and (<= 1e-20 (fabs dX.w)) (<= (fabs dX.w) 1e+20))) (and (<= 1e-20 (fabs dY.u)) (<= (fabs dY.u) 1e+20))) (and (<= 1e-20 (fabs dY.v)) (<= (fabs dY.v) 1e+20))) (and (<= 1e-20 (fabs dY.w)) (<= (fabs dY.w) 1e+20)))
  (log2 (sqrt (fmax (+ (+ (* (* (floor w) dX.u) (* (floor w) dX.u)) (* (* (floor h) dX.v) (* (floor h) dX.v))) (* (* (floor d) dX.w) (* (floor d) dX.w))) (+ (+ (* (* (floor w) dY.u) (* (floor w) dY.u)) (* (* (floor h) dY.v) (* (floor h) dY.v))) (* (* (floor d) dY.w) (* (floor d) dY.w)))))))