Disney BSSRDF, sample scattering profile, lower

Percentage Accurate: 61.4% → 99.3%
Time: 14.4s
Alternatives: 10
Speedup: 21.8×

Specification

?
\[\left(0 \leq s \land s \leq 256\right) \land \left(2.328306437 \cdot 10^{-10} \leq u \land u \leq 0.25\right)\]
\[\begin{array}{l} \\ s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \end{array} \]
(FPCore (s u) :precision binary32 (* s (log (/ 1.0 (- 1.0 (* 4.0 u))))))
float code(float s, float u) {
	return s * logf((1.0f / (1.0f - (4.0f * u))));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * log((1.0e0 / (1.0e0 - (4.0e0 * u))))
end function
function code(s, u)
	return Float32(s * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(4.0) * u)))))
end
function tmp = code(s, u)
	tmp = s * log((single(1.0) / (single(1.0) - (single(4.0) * u))));
end
\begin{array}{l}

\\
s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right)
\end{array}

Sampling outcomes in binary32 precision:

Local Percentage Accuracy vs ?

The average percentage accuracy by input value. Horizontal axis shows value of an input variable; the variable is choosen in the title. Vertical axis is accuracy; higher is better. Red represent the original program, while blue represents Herbie's suggestion. These can be toggled with buttons below the plot. The line is an average while dots represent individual samples.

Accuracy vs Speed?

Herbie found 10 alternatives:

AlternativeAccuracySpeedup
The accuracy (vertical axis) and speed (horizontal axis) of each alternatives. Up and to the right is better. The red square shows the initial program, and each blue circle shows an alternative.The line shows the best available speed-accuracy tradeoffs.

Initial Program: 61.4% accurate, 1.0× speedup?

\[\begin{array}{l} \\ s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \end{array} \]
(FPCore (s u) :precision binary32 (* s (log (/ 1.0 (- 1.0 (* 4.0 u))))))
float code(float s, float u) {
	return s * logf((1.0f / (1.0f - (4.0f * u))));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * log((1.0e0 / (1.0e0 - (4.0e0 * u))))
end function
function code(s, u)
	return Float32(s * log(Float32(Float32(1.0) / Float32(Float32(1.0) - Float32(Float32(4.0) * u)))))
end
function tmp = code(s, u)
	tmp = s * log((single(1.0) / (single(1.0) - (single(4.0) * u))));
end
\begin{array}{l}

\\
s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right)
\end{array}

Alternative 1: 99.3% accurate, 1.0× speedup?

\[\begin{array}{l} \\ s \cdot \left(-\mathsf{log1p}\left(u \cdot -4\right)\right) \end{array} \]
(FPCore (s u) :precision binary32 (* s (- (log1p (* u -4.0)))))
float code(float s, float u) {
	return s * -log1pf((u * -4.0f));
}
function code(s, u)
	return Float32(s * Float32(-log1p(Float32(u * Float32(-4.0)))))
end
\begin{array}{l}

\\
s \cdot \left(-\mathsf{log1p}\left(u \cdot -4\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Step-by-step derivation
    1. log-rec66.3%

      \[\leadsto s \cdot \color{blue}{\left(-\log \left(1 - 4 \cdot u\right)\right)} \]
    2. distribute-rgt-neg-out66.3%

      \[\leadsto \color{blue}{-s \cdot \log \left(1 - 4 \cdot u\right)} \]
    3. distribute-lft-neg-in66.3%

      \[\leadsto \color{blue}{\left(-s\right) \cdot \log \left(1 - 4 \cdot u\right)} \]
    4. cancel-sign-sub-inv66.3%

      \[\leadsto \left(-s\right) \cdot \log \color{blue}{\left(1 + \left(-4\right) \cdot u\right)} \]
    5. log1p-def99.3%

      \[\leadsto \left(-s\right) \cdot \color{blue}{\mathsf{log1p}\left(\left(-4\right) \cdot u\right)} \]
    6. *-commutative99.3%

      \[\leadsto \left(-s\right) \cdot \mathsf{log1p}\left(\color{blue}{u \cdot \left(-4\right)}\right) \]
    7. metadata-eval99.3%

      \[\leadsto \left(-s\right) \cdot \mathsf{log1p}\left(u \cdot \color{blue}{-4}\right) \]
  3. Simplified99.3%

    \[\leadsto \color{blue}{\left(-s\right) \cdot \mathsf{log1p}\left(u \cdot -4\right)} \]
  4. Final simplification99.3%

    \[\leadsto s \cdot \left(-\mathsf{log1p}\left(u \cdot -4\right)\right) \]

Alternative 2: 90.7% accurate, 6.4× speedup?

\[\begin{array}{l} \\ 4 \cdot \left(s \cdot u\right) + s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right) \end{array} \]
(FPCore (s u)
 :precision binary32
 (+ (* 4.0 (* s u)) (* s (* (* u u) (+ 8.0 (* u 21.333333333333332))))))
float code(float s, float u) {
	return (4.0f * (s * u)) + (s * ((u * u) * (8.0f + (u * 21.333333333333332f))));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = (4.0e0 * (s * u)) + (s * ((u * u) * (8.0e0 + (u * 21.333333333333332e0))))
end function
function code(s, u)
	return Float32(Float32(Float32(4.0) * Float32(s * u)) + Float32(s * Float32(Float32(u * u) * Float32(Float32(8.0) + Float32(u * Float32(21.333333333333332))))))
end
function tmp = code(s, u)
	tmp = (single(4.0) * (s * u)) + (s * ((u * u) * (single(8.0) + (u * single(21.333333333333332)))));
end
\begin{array}{l}

\\
4 \cdot \left(s \cdot u\right) + s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 90.3%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right) + \left(8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right)} \]
  3. Step-by-step derivation
    1. fma-def90.3%

      \[\leadsto \color{blue}{\mathsf{fma}\left(4, s \cdot u, 8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right)} \]
    2. *-commutative90.3%

      \[\leadsto \mathsf{fma}\left(4, \color{blue}{u \cdot s}, 8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) \]
    3. *-commutative90.3%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, 8 \cdot \color{blue}{\left({u}^{2} \cdot s\right)} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) \]
    4. associate-*r*90.4%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, \color{blue}{\left(8 \cdot {u}^{2}\right) \cdot s} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) \]
    5. *-commutative90.4%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, \left(8 \cdot {u}^{2}\right) \cdot s + 21.333333333333332 \cdot \color{blue}{\left({u}^{3} \cdot s\right)}\right) \]
    6. associate-*r*90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, \left(8 \cdot {u}^{2}\right) \cdot s + \color{blue}{\left(21.333333333333332 \cdot {u}^{3}\right) \cdot s}\right) \]
    7. distribute-rgt-out90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, \color{blue}{s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right)}\right) \]
    8. cube-mult90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot \color{blue}{\left(u \cdot \left(u \cdot u\right)\right)}\right)\right) \]
    9. unpow290.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot \left(u \cdot \color{blue}{{u}^{2}}\right)\right)\right) \]
    10. associate-*r*90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \left(8 \cdot {u}^{2} + \color{blue}{\left(21.333333333333332 \cdot u\right) \cdot {u}^{2}}\right)\right) \]
    11. distribute-rgt-out90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \color{blue}{\left({u}^{2} \cdot \left(8 + 21.333333333333332 \cdot u\right)\right)}\right) \]
    12. *-commutative90.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \left({u}^{2} \cdot \left(8 + \color{blue}{u \cdot 21.333333333333332}\right)\right)\right) \]
    13. unpow290.5%

      \[\leadsto \mathsf{fma}\left(4, u \cdot s, s \cdot \left(\color{blue}{\left(u \cdot u\right)} \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right) \]
  4. Simplified90.5%

    \[\leadsto \color{blue}{\mathsf{fma}\left(4, u \cdot s, s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right)} \]
  5. Step-by-step derivation
    1. fma-udef90.5%

      \[\leadsto \color{blue}{4 \cdot \left(u \cdot s\right) + s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right)} \]
  6. Applied egg-rr90.5%

    \[\leadsto \color{blue}{4 \cdot \left(u \cdot s\right) + s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right)} \]
  7. Final simplification90.5%

    \[\leadsto 4 \cdot \left(s \cdot u\right) + s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right) \]

Alternative 3: 90.7% accurate, 8.4× speedup?

\[\begin{array}{l} \\ s \cdot \left(u \cdot \left(4 + u \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right) \end{array} \]
(FPCore (s u)
 :precision binary32
 (* s (* u (+ 4.0 (* u (+ 8.0 (* u 21.333333333333332)))))))
float code(float s, float u) {
	return s * (u * (4.0f + (u * (8.0f + (u * 21.333333333333332f)))));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * (u * (4.0e0 + (u * (8.0e0 + (u * 21.333333333333332e0)))))
end function
function code(s, u)
	return Float32(s * Float32(u * Float32(Float32(4.0) + Float32(u * Float32(Float32(8.0) + Float32(u * Float32(21.333333333333332)))))))
end
function tmp = code(s, u)
	tmp = s * (u * (single(4.0) + (u * (single(8.0) + (u * single(21.333333333333332))))));
end
\begin{array}{l}

\\
s \cdot \left(u \cdot \left(4 + u \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 90.7%

    \[\leadsto s \cdot \color{blue}{\left(4 \cdot u + \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right)\right)} \]
  3. Step-by-step derivation
    1. *-commutative90.7%

      \[\leadsto s \cdot \left(\color{blue}{u \cdot 4} + \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right)\right) \]
    2. unpow290.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \left(8 \cdot \color{blue}{\left(u \cdot u\right)} + 21.333333333333332 \cdot {u}^{3}\right)\right) \]
    3. associate-*r*90.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \left(\color{blue}{\left(8 \cdot u\right) \cdot u} + 21.333333333333332 \cdot {u}^{3}\right)\right) \]
    4. unpow390.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \left(\left(8 \cdot u\right) \cdot u + 21.333333333333332 \cdot \color{blue}{\left(\left(u \cdot u\right) \cdot u\right)}\right)\right) \]
    5. unpow290.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \left(\left(8 \cdot u\right) \cdot u + 21.333333333333332 \cdot \left(\color{blue}{{u}^{2}} \cdot u\right)\right)\right) \]
    6. associate-*r*90.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \left(\left(8 \cdot u\right) \cdot u + \color{blue}{\left(21.333333333333332 \cdot {u}^{2}\right) \cdot u}\right)\right) \]
    7. distribute-rgt-out90.7%

      \[\leadsto s \cdot \left(u \cdot 4 + \color{blue}{u \cdot \left(8 \cdot u + 21.333333333333332 \cdot {u}^{2}\right)}\right) \]
    8. distribute-lft-out90.5%

      \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + \left(8 \cdot u + 21.333333333333332 \cdot {u}^{2}\right)\right)\right)} \]
    9. unpow290.5%

      \[\leadsto s \cdot \left(u \cdot \left(4 + \left(8 \cdot u + 21.333333333333332 \cdot \color{blue}{\left(u \cdot u\right)}\right)\right)\right) \]
    10. associate-*r*90.5%

      \[\leadsto s \cdot \left(u \cdot \left(4 + \left(8 \cdot u + \color{blue}{\left(21.333333333333332 \cdot u\right) \cdot u}\right)\right)\right) \]
    11. distribute-rgt-out90.5%

      \[\leadsto s \cdot \left(u \cdot \left(4 + \color{blue}{u \cdot \left(8 + 21.333333333333332 \cdot u\right)}\right)\right) \]
    12. *-commutative90.5%

      \[\leadsto s \cdot \left(u \cdot \left(4 + u \cdot \left(8 + \color{blue}{u \cdot 21.333333333333332}\right)\right)\right) \]
  4. Simplified90.5%

    \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + u \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right)} \]
  5. Final simplification90.5%

    \[\leadsto s \cdot \left(u \cdot \left(4 + u \cdot \left(8 + u \cdot 21.333333333333332\right)\right)\right) \]

Alternative 4: 86.7% accurate, 9.9× speedup?

\[\begin{array}{l} \\ s \cdot \left(u \cdot 4 + u \cdot \left(u \cdot 8\right)\right) \end{array} \]
(FPCore (s u) :precision binary32 (* s (+ (* u 4.0) (* u (* u 8.0)))))
float code(float s, float u) {
	return s * ((u * 4.0f) + (u * (u * 8.0f)));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * ((u * 4.0e0) + (u * (u * 8.0e0)))
end function
function code(s, u)
	return Float32(s * Float32(Float32(u * Float32(4.0)) + Float32(u * Float32(u * Float32(8.0)))))
end
function tmp = code(s, u)
	tmp = s * ((u * single(4.0)) + (u * (u * single(8.0))));
end
\begin{array}{l}

\\
s \cdot \left(u \cdot 4 + u \cdot \left(u \cdot 8\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 86.2%

    \[\leadsto s \cdot \color{blue}{\left(4 \cdot u + 8 \cdot {u}^{2}\right)} \]
  3. Step-by-step derivation
    1. unpow286.2%

      \[\leadsto s \cdot \left(4 \cdot u + 8 \cdot \color{blue}{\left(u \cdot u\right)}\right) \]
    2. associate-*r*86.2%

      \[\leadsto s \cdot \left(4 \cdot u + \color{blue}{\left(8 \cdot u\right) \cdot u}\right) \]
    3. distribute-rgt-out86.1%

      \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + 8 \cdot u\right)\right)} \]
    4. *-commutative86.1%

      \[\leadsto s \cdot \left(u \cdot \left(4 + \color{blue}{u \cdot 8}\right)\right) \]
  4. Simplified86.1%

    \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + u \cdot 8\right)\right)} \]
  5. Step-by-step derivation
    1. distribute-rgt-in86.2%

      \[\leadsto s \cdot \color{blue}{\left(4 \cdot u + \left(u \cdot 8\right) \cdot u\right)} \]
    2. *-commutative86.2%

      \[\leadsto s \cdot \left(\color{blue}{u \cdot 4} + \left(u \cdot 8\right) \cdot u\right) \]
  6. Applied egg-rr86.2%

    \[\leadsto s \cdot \color{blue}{\left(u \cdot 4 + \left(u \cdot 8\right) \cdot u\right)} \]
  7. Final simplification86.2%

    \[\leadsto s \cdot \left(u \cdot 4 + u \cdot \left(u \cdot 8\right)\right) \]

Alternative 5: 86.7% accurate, 9.9× speedup?

\[\begin{array}{l} \\ u \cdot \left(s \cdot 4 + 8 \cdot \left(s \cdot u\right)\right) \end{array} \]
(FPCore (s u) :precision binary32 (* u (+ (* s 4.0) (* 8.0 (* s u)))))
float code(float s, float u) {
	return u * ((s * 4.0f) + (8.0f * (s * u)));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = u * ((s * 4.0e0) + (8.0e0 * (s * u)))
end function
function code(s, u)
	return Float32(u * Float32(Float32(s * Float32(4.0)) + Float32(Float32(8.0) * Float32(s * u))))
end
function tmp = code(s, u)
	tmp = u * ((s * single(4.0)) + (single(8.0) * (s * u)));
end
\begin{array}{l}

\\
u \cdot \left(s \cdot 4 + 8 \cdot \left(s \cdot u\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 92.6%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right) + \left(8 \cdot \left(s \cdot {u}^{2}\right) + \left(21.333333333333332 \cdot \left(s \cdot {u}^{3}\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)\right)} \]
  3. Step-by-step derivation
    1. +-commutative92.6%

      \[\leadsto \color{blue}{\left(8 \cdot \left(s \cdot {u}^{2}\right) + \left(21.333333333333332 \cdot \left(s \cdot {u}^{3}\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)\right) + 4 \cdot \left(s \cdot u\right)} \]
    2. associate-+r+92.6%

      \[\leadsto \color{blue}{\left(\left(8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)} + 4 \cdot \left(s \cdot u\right) \]
    3. associate-+l+92.6%

      \[\leadsto \color{blue}{\left(8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right)} \]
    4. *-commutative92.6%

      \[\leadsto \left(8 \cdot \color{blue}{\left({u}^{2} \cdot s\right)} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    5. associate-*r*92.7%

      \[\leadsto \left(\color{blue}{\left(8 \cdot {u}^{2}\right) \cdot s} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    6. *-commutative92.7%

      \[\leadsto \left(\left(8 \cdot {u}^{2}\right) \cdot s + 21.333333333333332 \cdot \color{blue}{\left({u}^{3} \cdot s\right)}\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    7. associate-*r*92.8%

      \[\leadsto \left(\left(8 \cdot {u}^{2}\right) \cdot s + \color{blue}{\left(21.333333333333332 \cdot {u}^{3}\right) \cdot s}\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    8. distribute-rgt-out92.8%

      \[\leadsto \color{blue}{s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right)} + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    9. *-commutative92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(64 \cdot \color{blue}{\left({u}^{4} \cdot s\right)} + 4 \cdot \left(s \cdot u\right)\right) \]
    10. associate-*r*92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\color{blue}{\left(64 \cdot {u}^{4}\right) \cdot s} + 4 \cdot \left(s \cdot u\right)\right) \]
    11. *-commutative92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\left(64 \cdot {u}^{4}\right) \cdot s + 4 \cdot \color{blue}{\left(u \cdot s\right)}\right) \]
    12. associate-*r*93.1%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\left(64 \cdot {u}^{4}\right) \cdot s + \color{blue}{\left(4 \cdot u\right) \cdot s}\right) \]
    13. distribute-rgt-out93.1%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \color{blue}{s \cdot \left(64 \cdot {u}^{4} + 4 \cdot u\right)} \]
  4. Simplified93.1%

    \[\leadsto \color{blue}{s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right) + s \cdot \mathsf{fma}\left(64, {u}^{4}, 4 \cdot u\right)} \]
  5. Taylor expanded in u around 0 85.9%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right) + 8 \cdot \left(s \cdot {u}^{2}\right)} \]
  6. Step-by-step derivation
    1. +-commutative85.9%

      \[\leadsto \color{blue}{8 \cdot \left(s \cdot {u}^{2}\right) + 4 \cdot \left(s \cdot u\right)} \]
    2. unpow285.9%

      \[\leadsto 8 \cdot \left(s \cdot \color{blue}{\left(u \cdot u\right)}\right) + 4 \cdot \left(s \cdot u\right) \]
    3. *-commutative85.9%

      \[\leadsto 8 \cdot \color{blue}{\left(\left(u \cdot u\right) \cdot s\right)} + 4 \cdot \left(s \cdot u\right) \]
    4. associate-*l*85.9%

      \[\leadsto 8 \cdot \color{blue}{\left(u \cdot \left(u \cdot s\right)\right)} + 4 \cdot \left(s \cdot u\right) \]
    5. associate-*r*86.0%

      \[\leadsto \color{blue}{\left(8 \cdot u\right) \cdot \left(u \cdot s\right)} + 4 \cdot \left(s \cdot u\right) \]
    6. *-commutative86.0%

      \[\leadsto \left(8 \cdot u\right) \cdot \left(u \cdot s\right) + 4 \cdot \color{blue}{\left(u \cdot s\right)} \]
    7. distribute-rgt-in85.8%

      \[\leadsto \color{blue}{\left(u \cdot s\right) \cdot \left(8 \cdot u + 4\right)} \]
    8. *-commutative85.8%

      \[\leadsto \left(u \cdot s\right) \cdot \left(\color{blue}{u \cdot 8} + 4\right) \]
    9. fma-udef85.8%

      \[\leadsto \left(u \cdot s\right) \cdot \color{blue}{\mathsf{fma}\left(u, 8, 4\right)} \]
    10. associate-*r*86.1%

      \[\leadsto \color{blue}{u \cdot \left(s \cdot \mathsf{fma}\left(u, 8, 4\right)\right)} \]
  7. Simplified86.1%

    \[\leadsto \color{blue}{u \cdot \left(s \cdot \mathsf{fma}\left(u, 8, 4\right)\right)} \]
  8. Taylor expanded in u around 0 86.3%

    \[\leadsto u \cdot \color{blue}{\left(4 \cdot s + 8 \cdot \left(s \cdot u\right)\right)} \]
  9. Final simplification86.3%

    \[\leadsto u \cdot \left(s \cdot 4 + 8 \cdot \left(s \cdot u\right)\right) \]

Alternative 6: 86.5% accurate, 12.1× speedup?

\[\begin{array}{l} \\ s \cdot \left(u \cdot \left(4 + u \cdot 8\right)\right) \end{array} \]
(FPCore (s u) :precision binary32 (* s (* u (+ 4.0 (* u 8.0)))))
float code(float s, float u) {
	return s * (u * (4.0f + (u * 8.0f)));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * (u * (4.0e0 + (u * 8.0e0)))
end function
function code(s, u)
	return Float32(s * Float32(u * Float32(Float32(4.0) + Float32(u * Float32(8.0)))))
end
function tmp = code(s, u)
	tmp = s * (u * (single(4.0) + (u * single(8.0))));
end
\begin{array}{l}

\\
s \cdot \left(u \cdot \left(4 + u \cdot 8\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 86.2%

    \[\leadsto s \cdot \color{blue}{\left(4 \cdot u + 8 \cdot {u}^{2}\right)} \]
  3. Step-by-step derivation
    1. unpow286.2%

      \[\leadsto s \cdot \left(4 \cdot u + 8 \cdot \color{blue}{\left(u \cdot u\right)}\right) \]
    2. associate-*r*86.2%

      \[\leadsto s \cdot \left(4 \cdot u + \color{blue}{\left(8 \cdot u\right) \cdot u}\right) \]
    3. distribute-rgt-out86.1%

      \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + 8 \cdot u\right)\right)} \]
    4. *-commutative86.1%

      \[\leadsto s \cdot \left(u \cdot \left(4 + \color{blue}{u \cdot 8}\right)\right) \]
  4. Simplified86.1%

    \[\leadsto s \cdot \color{blue}{\left(u \cdot \left(4 + u \cdot 8\right)\right)} \]
  5. Final simplification86.1%

    \[\leadsto s \cdot \left(u \cdot \left(4 + u \cdot 8\right)\right) \]

Alternative 7: 86.5% accurate, 12.1× speedup?

\[\begin{array}{l} \\ u \cdot \left(s \cdot \left(4 + u \cdot 8\right)\right) \end{array} \]
(FPCore (s u) :precision binary32 (* u (* s (+ 4.0 (* u 8.0)))))
float code(float s, float u) {
	return u * (s * (4.0f + (u * 8.0f)));
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = u * (s * (4.0e0 + (u * 8.0e0)))
end function
function code(s, u)
	return Float32(u * Float32(s * Float32(Float32(4.0) + Float32(u * Float32(8.0)))))
end
function tmp = code(s, u)
	tmp = u * (s * (single(4.0) + (u * single(8.0))));
end
\begin{array}{l}

\\
u \cdot \left(s \cdot \left(4 + u \cdot 8\right)\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 92.6%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right) + \left(8 \cdot \left(s \cdot {u}^{2}\right) + \left(21.333333333333332 \cdot \left(s \cdot {u}^{3}\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)\right)} \]
  3. Step-by-step derivation
    1. +-commutative92.6%

      \[\leadsto \color{blue}{\left(8 \cdot \left(s \cdot {u}^{2}\right) + \left(21.333333333333332 \cdot \left(s \cdot {u}^{3}\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)\right) + 4 \cdot \left(s \cdot u\right)} \]
    2. associate-+r+92.6%

      \[\leadsto \color{blue}{\left(\left(8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + 64 \cdot \left(s \cdot {u}^{4}\right)\right)} + 4 \cdot \left(s \cdot u\right) \]
    3. associate-+l+92.6%

      \[\leadsto \color{blue}{\left(8 \cdot \left(s \cdot {u}^{2}\right) + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right)} \]
    4. *-commutative92.6%

      \[\leadsto \left(8 \cdot \color{blue}{\left({u}^{2} \cdot s\right)} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    5. associate-*r*92.7%

      \[\leadsto \left(\color{blue}{\left(8 \cdot {u}^{2}\right) \cdot s} + 21.333333333333332 \cdot \left(s \cdot {u}^{3}\right)\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    6. *-commutative92.7%

      \[\leadsto \left(\left(8 \cdot {u}^{2}\right) \cdot s + 21.333333333333332 \cdot \color{blue}{\left({u}^{3} \cdot s\right)}\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    7. associate-*r*92.8%

      \[\leadsto \left(\left(8 \cdot {u}^{2}\right) \cdot s + \color{blue}{\left(21.333333333333332 \cdot {u}^{3}\right) \cdot s}\right) + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    8. distribute-rgt-out92.8%

      \[\leadsto \color{blue}{s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right)} + \left(64 \cdot \left(s \cdot {u}^{4}\right) + 4 \cdot \left(s \cdot u\right)\right) \]
    9. *-commutative92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(64 \cdot \color{blue}{\left({u}^{4} \cdot s\right)} + 4 \cdot \left(s \cdot u\right)\right) \]
    10. associate-*r*92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\color{blue}{\left(64 \cdot {u}^{4}\right) \cdot s} + 4 \cdot \left(s \cdot u\right)\right) \]
    11. *-commutative92.8%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\left(64 \cdot {u}^{4}\right) \cdot s + 4 \cdot \color{blue}{\left(u \cdot s\right)}\right) \]
    12. associate-*r*93.1%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \left(\left(64 \cdot {u}^{4}\right) \cdot s + \color{blue}{\left(4 \cdot u\right) \cdot s}\right) \]
    13. distribute-rgt-out93.1%

      \[\leadsto s \cdot \left(8 \cdot {u}^{2} + 21.333333333333332 \cdot {u}^{3}\right) + \color{blue}{s \cdot \left(64 \cdot {u}^{4} + 4 \cdot u\right)} \]
  4. Simplified93.1%

    \[\leadsto \color{blue}{s \cdot \left(\left(u \cdot u\right) \cdot \left(8 + u \cdot 21.333333333333332\right)\right) + s \cdot \mathsf{fma}\left(64, {u}^{4}, 4 \cdot u\right)} \]
  5. Taylor expanded in u around 0 85.9%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right) + 8 \cdot \left(s \cdot {u}^{2}\right)} \]
  6. Step-by-step derivation
    1. +-commutative85.9%

      \[\leadsto \color{blue}{8 \cdot \left(s \cdot {u}^{2}\right) + 4 \cdot \left(s \cdot u\right)} \]
    2. unpow285.9%

      \[\leadsto 8 \cdot \left(s \cdot \color{blue}{\left(u \cdot u\right)}\right) + 4 \cdot \left(s \cdot u\right) \]
    3. *-commutative85.9%

      \[\leadsto 8 \cdot \color{blue}{\left(\left(u \cdot u\right) \cdot s\right)} + 4 \cdot \left(s \cdot u\right) \]
    4. associate-*l*85.9%

      \[\leadsto 8 \cdot \color{blue}{\left(u \cdot \left(u \cdot s\right)\right)} + 4 \cdot \left(s \cdot u\right) \]
    5. associate-*r*86.0%

      \[\leadsto \color{blue}{\left(8 \cdot u\right) \cdot \left(u \cdot s\right)} + 4 \cdot \left(s \cdot u\right) \]
    6. *-commutative86.0%

      \[\leadsto \left(8 \cdot u\right) \cdot \left(u \cdot s\right) + 4 \cdot \color{blue}{\left(u \cdot s\right)} \]
    7. distribute-rgt-in85.8%

      \[\leadsto \color{blue}{\left(u \cdot s\right) \cdot \left(8 \cdot u + 4\right)} \]
    8. *-commutative85.8%

      \[\leadsto \left(u \cdot s\right) \cdot \left(\color{blue}{u \cdot 8} + 4\right) \]
    9. fma-udef85.8%

      \[\leadsto \left(u \cdot s\right) \cdot \color{blue}{\mathsf{fma}\left(u, 8, 4\right)} \]
    10. associate-*r*86.1%

      \[\leadsto \color{blue}{u \cdot \left(s \cdot \mathsf{fma}\left(u, 8, 4\right)\right)} \]
  7. Simplified86.1%

    \[\leadsto \color{blue}{u \cdot \left(s \cdot \mathsf{fma}\left(u, 8, 4\right)\right)} \]
  8. Taylor expanded in s around 0 86.1%

    \[\leadsto u \cdot \color{blue}{\left(s \cdot \left(4 + 8 \cdot u\right)\right)} \]
  9. Final simplification86.1%

    \[\leadsto u \cdot \left(s \cdot \left(4 + u \cdot 8\right)\right) \]

Alternative 8: 73.5% accurate, 21.8× speedup?

\[\begin{array}{l} \\ 4 \cdot \left(s \cdot u\right) \end{array} \]
(FPCore (s u) :precision binary32 (* 4.0 (* s u)))
float code(float s, float u) {
	return 4.0f * (s * u);
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = 4.0e0 * (s * u)
end function
function code(s, u)
	return Float32(Float32(4.0) * Float32(s * u))
end
function tmp = code(s, u)
	tmp = single(4.0) * (s * u);
end
\begin{array}{l}

\\
4 \cdot \left(s \cdot u\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 72.3%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right)} \]
  3. Step-by-step derivation
    1. *-commutative72.3%

      \[\leadsto 4 \cdot \color{blue}{\left(u \cdot s\right)} \]
  4. Simplified72.3%

    \[\leadsto \color{blue}{4 \cdot \left(u \cdot s\right)} \]
  5. Final simplification72.3%

    \[\leadsto 4 \cdot \left(s \cdot u\right) \]

Alternative 9: 73.7% accurate, 21.8× speedup?

\[\begin{array}{l} \\ u \cdot \left(s \cdot 4\right) \end{array} \]
(FPCore (s u) :precision binary32 (* u (* s 4.0)))
float code(float s, float u) {
	return u * (s * 4.0f);
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = u * (s * 4.0e0)
end function
function code(s, u)
	return Float32(u * Float32(s * Float32(4.0)))
end
function tmp = code(s, u)
	tmp = u * (s * single(4.0));
end
\begin{array}{l}

\\
u \cdot \left(s \cdot 4\right)
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Taylor expanded in u around 0 72.3%

    \[\leadsto \color{blue}{4 \cdot \left(s \cdot u\right)} \]
  3. Step-by-step derivation
    1. associate-*r*72.5%

      \[\leadsto \color{blue}{\left(4 \cdot s\right) \cdot u} \]
    2. *-commutative72.5%

      \[\leadsto \color{blue}{u \cdot \left(4 \cdot s\right)} \]
  4. Simplified72.5%

    \[\leadsto \color{blue}{u \cdot \left(4 \cdot s\right)} \]
  5. Final simplification72.5%

    \[\leadsto u \cdot \left(s \cdot 4\right) \]

Alternative 10: 16.4% accurate, 36.3× speedup?

\[\begin{array}{l} \\ s \cdot 0 \end{array} \]
(FPCore (s u) :precision binary32 (* s 0.0))
float code(float s, float u) {
	return s * 0.0f;
}
real(4) function code(s, u)
    real(4), intent (in) :: s
    real(4), intent (in) :: u
    code = s * 0.0e0
end function
function code(s, u)
	return Float32(s * Float32(0.0))
end
function tmp = code(s, u)
	tmp = s * single(0.0);
end
\begin{array}{l}

\\
s \cdot 0
\end{array}
Derivation
  1. Initial program 63.0%

    \[s \cdot \log \left(\frac{1}{1 - 4 \cdot u}\right) \]
  2. Applied egg-rr16.1%

    \[\leadsto s \cdot \color{blue}{0} \]
  3. Final simplification16.1%

    \[\leadsto s \cdot 0 \]

Reproduce

?
herbie shell --seed 2023287 
(FPCore (s u)
  :name "Disney BSSRDF, sample scattering profile, lower"
  :precision binary32
  :pre (and (and (<= 0.0 s) (<= s 256.0)) (and (<= 2.328306437e-10 u) (<= u 0.25)))
  (* s (log (/ 1.0 (- 1.0 (* 4.0 u))))))