
; Input program, evaluated in binary32:
;   exp( (((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v) + 0.6931
;        + log(1 / (2*v)) )
; The nesting below fixes the order in which the terms are combined.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Evaluate
!!   exp((((cos_i*cos_o)/v - (sin_i*sin_o)/v) - 1/v) + 0.6931 + log(1/(2*v)))
!! in real(4), combining the terms in the order written.
!!
!! All five arguments are read-only real(4) scalars; the result is real(4).
!! Every literal carries the _4 kind suffix so the arithmetic stays in real(4)
!! even if the compiler's default real kind is changed by a build option.
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: cos_term, sin_term, log_term

    cos_term = (costheta_i * costheta_o) / v
    sin_term = (sintheta_i * sintheta_o) / v
    log_term = log(1.0_4 / (2.0_4 * v))
    code = exp((((cos_term - sin_term) - (1.0_4 / v)) + 0.6931_4) + log_term)
end function code
# Evaluates exp((((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v)
#               + 0.6931 + log(1/(2*v))),
# rounding every intermediate result to Float32 at the same points as the
# single-expression form.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cos_term = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_term = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    inv_v = Float32(Float32(1.0) / v)
    shifted = Float32(Float32(Float32(cos_term - sin_term) - inv_v) + Float32(0.6931))
    log_term = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    return exp(Float32(shifted + log_term))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Evaluates exp((((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v)
    %               + 0.6931 + log(1/(2*v)))
    % with single-precision constants, combining terms in the order shown.
    cos_term = (cosTheta_i * cosTheta_O) / v;
    sin_term = (sinTheta_i * sinTheta_O) / v;
    inv_v = single(1.0) / v;
    log_term = log(single(1.0) / (single(2.0) * v));
    tmp = exp((((cos_term - sin_term) - inv_v) + single(0.6931)) + log_term);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Unmodified input expression, listed alongside the alternatives:
;   exp( (((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v) + 0.6931
;        + log(1 / (2*v)) )
; evaluated in binary32 with the association fixed by the nesting below.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Unmodified input expression:
!!   exp((((cos_i*cos_o)/v - (sin_i*sin_o)/v) - 1/v) + 0.6931 + log(1/(2*v)))
!! evaluated in real(4) with the terms combined in the order written.
!!
!! Arguments are read-only real(4) scalars; the result is real(4). Literals
!! use the _4 kind suffix so no operation is promoted to a wider kind when
!! the default real kind differs from real(4).
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: cos_over_v, sin_over_v, log_term

    cos_over_v = (costheta_i * costheta_o) / v
    sin_over_v = (sintheta_i * sintheta_o) / v
    log_term = log(1.0_4 / (2.0_4 * v))
    code = exp((((cos_over_v - sin_over_v) - (1.0_4 / v)) + 0.6931_4) + log_term)
end function code
# Unmodified input expression:
#   exp((((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v)
#       + 0.6931 + log(1/(2*v)))
# Each step is rounded to Float32 at the same place as in the one-line form.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cos_over_v = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_over_v = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    difference = Float32(cos_over_v - sin_over_v)
    minus_inv = Float32(difference - Float32(Float32(1.0) / v))
    plus_const = Float32(minus_inv + Float32(0.6931))
    log_term = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    return exp(Float32(plus_const + log_term))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Unmodified input expression:
    %   exp((((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v)
    %       + 0.6931 + log(1/(2*v)))
    % using single-precision constants and the association shown.
    cos_over_v = (cosTheta_i * cosTheta_O) / v;
    sin_over_v = (sinTheta_i * sinTheta_O) / v;
    partial = ((cos_over_v - sin_over_v) - (single(1.0) / v)) + single(0.6931);
    log_term = log(single(1.0) / (single(2.0) * v));
    tmp = exp(partial + log_term);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
; Alternative: cube of the cube root of
;   0.5 * ((exp(fma(cosTheta_i, cosTheta_O, -1) / v) * exp(0.6931)) / v).
; sinTheta_i and sinTheta_O are accepted but not referenced by the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (pow (cbrt (* 0.5 (/ (* (exp (/ (fma cosTheta_i cosTheta_O -1.0) v)) (exp 0.6931)) v))) 3.0))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return powf(cbrtf((0.5f * ((expf((fmaf(cosTheta_i, cosTheta_O, -1.0f) / v)) * expf(0.6931f)) / v))), 3.0f);
}
# Alternative form: cbrt(x)^3 where
#   x = 0.5 * ((exp(fma(cosTheta_i, cosTheta_O, -1) / v) * exp(0.6931)) / v),
# with Float32 rounding applied after each arithmetic step.
# sinTheta_i and sinTheta_O are accepted but not read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    scaled = Float32(fma(cosTheta_i, cosTheta_O, Float32(-1.0)) / v)
    numerator = Float32(exp(scaled) * exp(Float32(0.6931)))
    radicand = Float32(Float32(0.5) * Float32(numerator / v))
    return cbrt(radicand) ^ Float32(3.0)
end
\begin{array}{l}
\\
{\left(\sqrt[3]{0.5 \cdot \frac{e^{\frac{\mathsf{fma}\left(cosTheta\_i, cosTheta\_O, -1\right)}{v}} \cdot e^{0.6931}}{v}}\right)}^{3}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
associate-*l/ 99.7%
clear-num 99.7%
Applied egg-rr 99.7%
Taylor expanded in sinTheta_i around 0 99.7%
add-cube-cbrt 99.7%
pow3 99.7%
Applied egg-rr 99.7%
+-commutative 99.7%
exp-sum 99.7%
fma-neg 99.7%
metadata-eval 99.7%
Applied egg-rr 99.7%
; Alternative: ((cbrt(0.5))^3 * exp(0.6931 - 1/v)) / v.
; Only v is referenced; the four angle arguments are accepted but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (pow (cbrt 0.5) 3.0) (exp (- 0.6931 (/ 1.0 v)))) v))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (powf(cbrtf(0.5f), 3.0f) * expf((0.6931f - (1.0f / v)))) / v;
}
# Alternative form: ((cbrt(0.5))^3 * exp(0.6931 - 1/v)) / v, rounded to
# Float32 after each arithmetic step. Only v is read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    cubed_root = cbrt(Float32(0.5)) ^ Float32(3.0)
    decay = exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))
    product = Float32(cubed_root * decay)
    return Float32(product / v)
end
\begin{array}{l}
\\
\frac{{\left(\sqrt[3]{0.5}\right)}^{3} \cdot e^{0.6931 - \frac{1}{v}}}{v}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
associate-*l/ 99.7%
clear-num 99.7%
Applied egg-rr 99.7%
Taylor expanded in sinTheta_i around 0 99.7%
add-cube-cbrt 99.7%
pow3 99.7%
Applied egg-rr 99.7%
Taylor expanded in cosTheta_i around 0 99.7%
; Alternative: 1 / (v / (0.5 * exp(0.6931 - 1/v))).
; Only v is referenced; the four angle arguments are accepted but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ 1.0 (/ v (* 0.5 (exp (- 0.6931 (/ 1.0 v)))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 1.0f / (v / (0.5f * expf((0.6931f - (1.0f / v)))));
}
!> Alternative form: 1 / (v / (0.5 * exp(0.6931 - 1/v))), evaluated in real(4).
!!
!! Only v is read; the four angle arguments are kept for signature
!! compatibility and are unused. Literals carry the _4 kind suffix so the
!! arithmetic stays in real(4) regardless of the default real kind.
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: half_decay

    half_decay = 0.5_4 * exp(0.6931_4 - (1.0_4 / v))
    code = 1.0_4 / (v / half_decay)
end function code
# Alternative form: 1 / (v / (0.5 * exp(0.6931 - 1/v))), rounded to Float32
# after each arithmetic step. Only v is read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    decay = exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))
    half_decay = Float32(Float32(0.5) * decay)
    ratio = Float32(v / half_decay)
    return Float32(Float32(1.0) / ratio)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Alternative form: 1 / (v / (0.5 * exp(0.6931 - 1/v))) with
    % single-precision constants. Only v is read.
    decay = exp(single(0.6931) - (single(1.0) / v));
    half_decay = single(0.5) * decay;
    tmp = single(1.0) / (v / half_decay);
end
\begin{array}{l}
\\
\frac{1}{\frac{v}{0.5 \cdot e^{0.6931 - \frac{1}{v}}}}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
associate-*l/ 99.7%
clear-num 99.7%
Applied egg-rr 99.7%
Taylor expanded in sinTheta_i around 0 99.7%
Taylor expanded in cosTheta_O around 0 99.7%
; Alternative: 0.5 * (exp(0.6931 - 1/v) / v).
; Only v is referenced; the four angle arguments are accepted but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* 0.5 (/ (exp (- 0.6931 (/ 1.0 v))) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 0.5f * (expf((0.6931f - (1.0f / v))) / v);
}
!> Alternative form: 0.5 * (exp(0.6931 - 1/v) / v), evaluated in real(4).
!!
!! Only v is read; the four angle arguments are kept for signature
!! compatibility and are unused. Literals carry the _4 kind suffix so the
!! arithmetic stays in real(4) regardless of the default real kind.
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: decay

    decay = exp(0.6931_4 - (1.0_4 / v))
    code = 0.5_4 * (decay / v)
end function code
# Alternative form: 0.5 * (exp(0.6931 - 1/v) / v), rounded to Float32 after
# each arithmetic step. Only v is read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    decay = exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))
    decay_over_v = Float32(decay / v)
    return Float32(Float32(0.5) * decay_over_v)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Alternative form: 0.5 * (exp(0.6931 - 1/v) / v) with single-precision
    % constants. Only v is read.
    decay = exp(single(0.6931) - (single(1.0) / v));
    tmp = single(0.5) * (decay / v);
end
\begin{array}{l}
\\
0.5 \cdot \frac{e^{0.6931 - \frac{1}{v}}}{v}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
associate-*l/ 99.7%
clear-num 99.7%
Applied egg-rr 99.7%
Taylor expanded in sinTheta_i around 0 99.7%
Taylor expanded in cosTheta_O around 0 99.7%
; Alternative: -0.5 * ((sinTheta_O * sinTheta_i) / v^2).
; cosTheta_i and cosTheta_O are accepted but not referenced by the body.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* -0.5 (/ (* sinTheta_O sinTheta_i) (pow v 2.0))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return -0.5f * ((sinTheta_O * sinTheta_i) / powf(v, 2.0f));
}
!> Alternative form: -0.5 * ((sin_o * sin_i) / v**2.0), evaluated in real(4).
!!
!! costheta_i and costheta_o are kept for signature compatibility and are
!! unused. Literals carry the _4 kind suffix so the arithmetic stays in
!! real(4) regardless of the default real kind; the exponent is deliberately
!! left as a real value, matching the expression this was generated from.
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v
    real(4) :: sin_product

    sin_product = sintheta_o * sintheta_i
    code = (-0.5_4) * (sin_product / (v ** 2.0_4))
end function code
# Alternative form: -0.5 * ((sinTheta_O * sinTheta_i) / v^2), rounded to
# Float32 after each arithmetic step. cosTheta_i and cosTheta_O are not read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    sin_product = Float32(sinTheta_O * sinTheta_i)
    v_squared = v ^ Float32(2.0)
    return Float32(Float32(-0.5) * Float32(sin_product / v_squared))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Alternative form: -0.5 * ((sinTheta_O * sinTheta_i) / v^2) with
    % single-precision constants. cosTheta_i and cosTheta_O are not read.
    sin_product = sinTheta_O * sinTheta_i;
    v_squared = v ^ single(2.0);
    tmp = single(-0.5) * (sin_product / v_squared);
end
\begin{array}{l}
\\
-0.5 \cdot \frac{sinTheta\_O \cdot sinTheta\_i}{{v}^{2}}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
Taylor expanded in sinTheta_i around inf 11.4%
associate-*r/ 11.4%
mul-1-neg 11.4%
Simplified 11.4%
Taylor expanded in v around inf 4.7%
Taylor expanded in sinTheta_O around inf 20.2%
; Alternative: 0.5 / v.
; Only v is referenced; the four angle arguments are accepted but unused.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ 0.5 v))
/*
 * Alternative form: 0.5f / v.
 * Only v is read; the four angle parameters are unused.
 */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
	const float numerator = 0.5f;
	return numerator / v;
}
!> Alternative form: 0.5 / v, evaluated in real(4).
!!
!! Only v is read; the four angle arguments are kept for signature
!! compatibility and are unused. The literal carries the _4 kind suffix so
!! the division stays in real(4) regardless of the default real kind.
pure real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o, sintheta_i, sintheta_o, v

    code = 0.5_4 / v
end function code
# Alternative form: 0.5 / v, rounded to Float32. Only v is read.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    numerator = Float32(0.5)
    return Float32(numerator / v)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Alternative form: 0.5 / v with a single-precision constant.
    % Only v is read.
    numerator = single(0.5);
    tmp = numerator / v;
end
\begin{array}{l}
\\
\frac{0.5}{v}
\end{array}
Initial program 99.2%
exp-sum 99.3%
*-commutative 99.3%
rem-exp-log 99.3%
associate-/r* 99.3%
metadata-eval 99.3%
associate--l- 99.3%
associate-/l* 99.3%
associate-/l* 99.3%
fma-define 99.3%
Simplified 99.3%
Taylor expanded in sinTheta_i around inf 11.4%
associate-*r/ 11.4%
mul-1-neg 11.4%
Simplified 11.4%
Taylor expanded in v around inf 4.7%
herbie shell --seed 2024106
; Benchmark definition in binary32.
; Precondition: cosTheta_i, cosTheta_O, sinTheta_i and sinTheta_O each lie in
; [-1, 1], and v lies in [-1.5707964, 0.1].
; Body: exp((((cosTheta_i*cosTheta_O)/v - (sinTheta_i*sinTheta_O)/v) - 1/v)
;           + 0.6931 + log(1 / (2*v))).
; NOTE(review): the precondition admits v <= 0, where log(1 / (2*v)) has no
; real value (and 1/v divides by zero at v = 0) -- confirm whether the lower
; bound on v is intended.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))