
; Input program: exp of a sum of a scaled angle term, the constant 0.6931,
; and log(1 / (2 v)), all evaluated in binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((cos_term (/ (* cosTheta_i cosTheta_O) v))
         (sin_term (/ (* sinTheta_i sinTheta_O) v))
         ; Same association as the fully nested form.
         (shifted (+ (- (- cos_term sin_term) (/ 1.0 v)) 0.6931))
         (log_norm (log (/ 1.0 (* 2.0 v)))))
    (exp (+ shifted log_norm))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Single-precision evaluation of
!>   exp(((cos_i*cos_o)/v - (sin_i*sin_o)/v - 1/v + 0.6931) + log(1/(2*v))).
!> The expression is split into named intermediates so that no source line
!> exceeds the 132-character free-form limit; the order of operations is
!> the same as in the single-expression form.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i
    real(4), intent (in) :: costheta_o
    real(4), intent (in) :: sintheta_i
    real(4), intent (in) :: sintheta_o
    real(4), intent (in) :: v
    real(4) :: cos_term, sin_term, shifted, log_norm

    cos_term = (costheta_i * costheta_o) / v
    sin_term = (sintheta_i * sintheta_o) / v
    shifted = ((cos_term - sin_term) - (1.0e0 / v)) + 0.6931e0
    log_norm = log(1.0e0 / (2.0e0 * v))
    code = exp(shifted + log_norm)
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Every intermediate is rounded to Float32, in the same order as the
    # single-expression form.
    cos_term = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_term = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    inv_v = Float32(Float32(1.0) / v)
    shifted = Float32(Float32(Float32(cos_term - sin_term) - inv_v) + Float32(0.6931))
    log_norm = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    return exp(Float32(shifted + log_norm))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Evaluates exp(((cos_i*cos_O)/v - (sin_i*sin_O)/v - 1/v + 0.6931) + log(1/(2*v)))
    % with single-precision constants, in the same order of operations as
    % the one-line form.
    cos_term = (cosTheta_i * cosTheta_O) / v;
    sin_term = (sinTheta_i * sinTheta_O) / v;
    inv_v = single(1.0) / v;
    shifted = ((cos_term - sin_term) - inv_v) + single(0.6931);
    log_norm = log(single(1.0) / (single(2.0) * v));
    tmp = exp(shifted + log_norm);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; First table entry: identical to the input program. Computes exp of a
; scaled angle term plus 0.6931 plus log(1 / (2 v)) in binary32.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((cos_term (/ (* cosTheta_i cosTheta_O) v))
         (sin_term (/ (* sinTheta_i sinTheta_O) v))
         ; Same association as the fully nested form.
         (shifted (+ (- (- cos_term sin_term) (/ 1.0 v)) 0.6931))
         (log_norm (log (/ 1.0 (* 2.0 v)))))
    (exp (+ shifted log_norm))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
!> Single-precision evaluation of
!>   exp(((cos_i*cos_o)/v - (sin_i*sin_o)/v - 1/v + 0.6931) + log(1/(2*v))).
!> The expression is split into named intermediates so that no source line
!> exceeds the 132-character free-form limit; the order of operations is
!> the same as in the single-expression form.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i
    real(4), intent (in) :: costheta_o
    real(4), intent (in) :: sintheta_i
    real(4), intent (in) :: sintheta_o
    real(4), intent (in) :: v
    real(4) :: cos_term, sin_term, shifted, log_norm

    cos_term = (costheta_i * costheta_o) / v
    sin_term = (sintheta_i * sintheta_o) / v
    shifted = ((cos_term - sin_term) - (1.0e0 / v)) + 0.6931e0
    log_norm = log(1.0e0 / (2.0e0 * v))
    code = exp(shifted + log_norm)
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Every intermediate is rounded to Float32, in the same order as the
    # single-expression form.
    cos_term = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    sin_term = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    inv_v = Float32(Float32(1.0) / v)
    shifted = Float32(Float32(Float32(cos_term - sin_term) - inv_v) + Float32(0.6931))
    log_norm = log(Float32(Float32(1.0) / Float32(Float32(2.0) * v)))
    return exp(Float32(shifted + log_norm))
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Evaluates exp(((cos_i*cos_O)/v - (sin_i*sin_O)/v - 1/v + 0.6931) + log(1/(2*v)))
    % with single-precision constants, in the same order of operations as
    % the one-line form.
    cos_term = (cosTheta_i * cosTheta_O) / v;
    sin_term = (sinTheta_i * sinTheta_O) / v;
    inv_v = single(1.0) / v;
    shifted = ((cos_term - sin_term) - inv_v) + single(0.6931);
    log_norm = log(single(1.0) / (single(2.0) * v));
    tmp = exp(shifted + log_norm);
end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
; Cube-root/cube rewrite of the input program.
; The sine product is negated inside the fma so that the exponent equals
; (cos_i*cos_O - sin_i*sin_O - 1) / v, matching the input program, which
; subtracts (sin_i*sin_O)/v.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
 :precision binary32
 (let* ((t_0
         (cbrt
          (*
           (exp
            (+
             (/
              (+ (fma cosTheta_i cosTheta_O (* sinTheta_i (- sinTheta_O))) -1.0)
              v)
             0.6931))
           (/ 0.5 v)))))
   (pow (* (pow (pow t_0 2.0) 0.3333333333333333) (cbrt t_0)) 3.0)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = cbrtf((expf((((fmaf(cosTheta_i, cosTheta_O, (sinTheta_i * sinTheta_O)) + -1.0f) / v) + 0.6931f)) * (0.5f / v)));
return powf((powf(powf(t_0, 2.0f), 0.3333333333333333f) * cbrtf(t_0)), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Cube-root/cube rewrite of the input program. The sine product is
    # negated before it enters the fma so that the exponent is
    # (cos_i*cos_O - sin_i*sin_O - 1) / v, as in the input program.
    # Statements are placed on separate lines; the one-line form ran the
    # assignment and the return together.
    neg_sin_prod = Float32(sinTheta_i * Float32(-sinTheta_O))
    exponent = Float32(Float32(Float32(fma(cosTheta_i, cosTheta_O, neg_sin_prod) + Float32(-1.0)) / v) + Float32(0.6931))
    t_0 = cbrt(Float32(exp(exponent) * Float32(Float32(0.5) / v)))
    return Float32(((t_0 ^ Float32(2.0)) ^ Float32(0.3333333333333333)) * cbrt(t_0)) ^ Float32(3.0)
end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt[3]{e^{\frac{\mathsf{fma}\left(cosTheta\_i, cosTheta\_O, sinTheta\_i \cdot \left(-sinTheta\_O\right)\right) + -1}{v} + 0.6931} \cdot \frac{0.5}{v}}\\
{\left({\left({t\_0}^{2}\right)}^{0.3333333333333333} \cdot \sqrt[3]{t\_0}\right)}^{3}
\end{array}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
add-cube-cbrt 99.4%
pow3 99.4%
Applied egg-rr 99.9%
pow1/3 99.8%
add-cube-cbrt 99.8%
unpow-prod-down 99.8%
Applied egg-rr 99.9%
Final simplification 99.9%
; Product of a cube root and a sixth root, squared.
; The second factor omits the cosine product.
; In both factors the sine product is negated so that it is subtracted,
; matching the input program, which subtracts (sin_i*sin_O)/v.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
 :precision binary32
 (pow
  (*
   (cbrt
    (*
     (exp
      (+
       (/ (+ (fma cosTheta_i cosTheta_O (* sinTheta_i (- sinTheta_O))) -1.0) v)
       0.6931))
     (/ 0.5 v)))
   (pow
    (* (/ 0.5 v) (exp (+ 0.6931 (/ (+ (* sinTheta_i (- sinTheta_O)) -1.0) v))))
    0.16666666666666666))
  2.0))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return powf((cbrtf((expf((((fmaf(cosTheta_i, cosTheta_O, (sinTheta_i * sinTheta_O)) + -1.0f) / v) + 0.6931f)) * (0.5f / v))) * powf(((0.5f / v) * expf((0.6931f + (((sinTheta_i * sinTheta_O) + -1.0f) / v)))), 0.16666666666666666f)), 2.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Product of a cube root and a sixth root, squared. The second factor
    # omits the cosine product.
    # In both factors the sine product is negated so that it is subtracted,
    # matching the input program's -(sin_i*sin_O)/v term.
    neg_sin_prod = Float32(sinTheta_i * Float32(-sinTheta_O))
    half_over_v = Float32(Float32(0.5) / v)
    full = Float32(exp(Float32(Float32(Float32(fma(cosTheta_i, cosTheta_O, neg_sin_prod) + Float32(-1.0)) / v) + Float32(0.6931))) * half_over_v)
    no_cos = Float32(half_over_v * exp(Float32(Float32(0.6931) + Float32(Float32(neg_sin_prod + Float32(-1.0)) / v))))
    return Float32(cbrt(full) * (no_cos ^ Float32(0.16666666666666666))) ^ Float32(2.0)
end
\begin{array}{l}
\\
{\left(\sqrt[3]{e^{\frac{\mathsf{fma}\left(cosTheta\_i, cosTheta\_O, sinTheta\_i \cdot \left(-sinTheta\_O\right)\right) + -1}{v} + 0.6931} \cdot \frac{0.5}{v}} \cdot {\left(\frac{0.5}{v} \cdot e^{0.6931 + \frac{sinTheta\_i \cdot \left(-sinTheta\_O\right) + -1}{v}}\right)}^{0.16666666666666666}\right)}^{2}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
add-sqr-sqrt 99.4%
pow2 99.4%
Applied egg-rr 99.8%
add-cube-cbrt 99.9%
sqrt-prod 99.9%
Applied egg-rr 99.9%
Taylor expanded in cosTheta_i around 0 99.9%
Final simplification 99.9%
; Cube of the cube root of (0.5 / v) * exp(0.6931 - 1 / v).
; The four angle inputs are not used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((scale (/ 0.5 v))
         (decay (exp (- 0.6931 (/ 1.0 v)))))
    (pow (cbrt (* scale decay)) 3.0)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return powf(cbrtf(((0.5f / v) * expf((0.6931f - (1.0f / v))))), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Cube of the cube root of (0.5 / v) * exp(0.6931 - 1 / v).
    # The four angle arguments are not used.
    scale = Float32(Float32(0.5) / v)
    decay = exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))
    root = cbrt(Float32(scale * decay))
    return root ^ Float32(3.0)
end
\begin{array}{l}
\\
{\left(\sqrt[3]{\frac{0.5}{v} \cdot e^{0.6931 - \frac{1}{v}}}\right)}^{3}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
add-cube-cbrt 99.4%
pow3 99.4%
Applied egg-rr 99.9%
Taylor expanded in cosTheta_i around inf 99.9%
Taylor expanded in cosTheta_O around 0 99.9%
Final simplification 99.9%
; (0.5 / v) * exp(0.6931 - 1 / v); the four angle inputs are not used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let* ((scale (/ 0.5 v))
         (decay (exp (- 0.6931 (/ 1.0 v)))))
    (* scale decay)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f - (1.0f / v)));
}
!> Returns (0.5 / v) * exp(0.6931 - 1 / v).
!> The four angle arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i, costheta_o
    real(4), intent (in) :: sintheta_i, sintheta_o
    real(4), intent (in) :: v
    real(4) :: scale, decay

    scale = 0.5e0 / v
    decay = exp(0.6931e0 - (1.0e0 / v))
    code = scale * decay
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # (0.5 / v) * exp(0.6931 - 1 / v); the four angle arguments are not used.
    scale = Float32(Float32(0.5) / v)
    decay = exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))
    return Float32(scale * decay)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Returns (0.5 / v) * exp(0.6931 - 1 / v) with single-precision constants.
    % The four angle arguments are not used.
    scale = single(0.5) / v;
    decay = exp(single(0.6931) - (single(1.0) / v));
    tmp = scale * decay;
end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 - \frac{1}{v}}
\end{array}
Initial program 99.8%
exp-sum 99.9%
*-commutative 99.9%
rem-exp-log 99.8%
associate-/r* 99.8%
metadata-eval 99.8%
associate--l- 99.8%
associate-/l* 99.8%
*-commutative 99.8%
associate-/l* 99.8%
fma-define 99.8%
Simplified 99.8%
Taylor expanded in sinTheta_O around 0 99.8%
Taylor expanded in cosTheta_O around 0 99.8%
Final simplification 99.8%
; exp(-1 / v); the four angle inputs are not used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let ((neg_inv_v (/ -1.0 v)))
    (exp neg_inv_v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((-1.0f / v));
}
!> Returns exp(-1 / v).
!> The four angle arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i, costheta_o
    real(4), intent (in) :: sintheta_i, sintheta_o
    real(4), intent (in) :: v
    real(4) :: neg_inv_v

    neg_inv_v = (-1.0e0) / v
    code = exp(neg_inv_v)
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # exp(-1 / v); the four angle arguments are not used.
    neg_inv_v = Float32(Float32(-1.0) / v)
    return exp(neg_inv_v)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Returns exp(-1 / v) with a single-precision numerator.
    % The four angle arguments are not used.
    neg_inv_v = single(-1.0) / v;
    tmp = exp(neg_inv_v);
end
\begin{array}{l}
\\
e^{\frac{-1}{v}}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
Taylor expanded in sinTheta_i around 0 99.8%
Taylor expanded in v around 0 98.6%
Taylor expanded in cosTheta_O around 0 98.6%
Final simplification 98.6%
; sinTheta_O * (sinTheta_i / v); the cosine inputs are not used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let ((ratio (/ sinTheta_i v)))
    (* sinTheta_O ratio)))
/*
 * Returns sinTheta_O * (sinTheta_i / v); the division is done first.
 * The cosine arguments are accepted but not used.
 */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    const float ratio = sinTheta_i / v;
    return sinTheta_O * ratio;
}
!> Returns sintheta_o * (sintheta_i / v); the division is done first.
!> The cosine arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i, costheta_o
    real(4), intent (in) :: sintheta_i, sintheta_o
    real(4), intent (in) :: v
    real(4) :: ratio

    ratio = sintheta_i / v
    code = sintheta_o * ratio
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # sinTheta_O * (sinTheta_i / v); the cosine arguments are not used.
    ratio = Float32(sinTheta_i / v)
    return Float32(sinTheta_O * ratio)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Returns sinTheta_O * (sinTheta_i / v); the division is done first.
    % The cosine arguments are not used.
    ratio = sinTheta_i / v;
    tmp = sinTheta_O * ratio;
end
\begin{array}{l}
\\
sinTheta\_O \cdot \frac{sinTheta\_i}{v}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
Taylor expanded in sinTheta_i around inf 14.5%
associate-*r/ 14.5%
*-commutative 14.5%
neg-mul-1 14.5%
distribute-rgt-neg-in 14.5%
Simplified 14.5%
associate-/l* 14.5%
add-sqr-sqrt 7.4%
sqrt-unprod 16.0%
sqr-neg 16.0%
sqrt-unprod 8.6%
add-sqr-sqrt 14.8%
Applied egg-rr 14.8%
Taylor expanded in sinTheta_i around 0 6.2%
Taylor expanded in sinTheta_O around inf 32.1%
associate-*r/ 16.2%
Simplified 16.2%
Final simplification 16.2%
; (sinTheta_i * sinTheta_O) / v; the cosine inputs are not used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (let ((sin_prod (* sinTheta_i sinTheta_O)))
    (/ sin_prod v)))
/*
 * Returns (sinTheta_i * sinTheta_O) / v; the product is formed first.
 * The cosine arguments are accepted but not used.
 */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    const float sin_prod = sinTheta_i * sinTheta_O;
    return sin_prod / v;
}
!> Returns (sintheta_i * sintheta_o) / v; the product is formed first.
!> The cosine arguments are accepted but not used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i, costheta_o
    real(4), intent (in) :: sintheta_i, sintheta_o
    real(4), intent (in) :: v
    real(4) :: sin_prod

    sin_prod = sintheta_i * sintheta_o
    code = sin_prod / v
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # (sinTheta_i * sinTheta_O) / v; the cosine arguments are not used.
    sin_prod = Float32(sinTheta_i * sinTheta_O)
    return Float32(sin_prod / v)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Returns (sinTheta_i * sinTheta_O) / v; the product is formed first.
    % The cosine arguments are not used.
    sin_prod = sinTheta_i * sinTheta_O;
    tmp = sin_prod / v;
end
\begin{array}{l}
\\
\frac{sinTheta\_i \cdot sinTheta\_O}{v}
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
Taylor expanded in sinTheta_i around inf 14.5%
associate-*r/ 14.5%
*-commutative 14.5%
neg-mul-1 14.5%
distribute-rgt-neg-in 14.5%
Simplified 14.5%
associate-/l* 14.5%
add-sqr-sqrt 7.4%
sqrt-unprod 16.0%
sqr-neg 16.0%
sqrt-unprod 8.6%
add-sqr-sqrt 14.8%
Applied egg-rr 14.8%
Taylor expanded in sinTheta_i around 0 6.2%
Taylor expanded in sinTheta_O around inf 32.1%
Final simplification 32.1%
; Constant alternative: always 1.0; none of the inputs are used.
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  1.0)
/* Constant alternative: always returns 1.0f; no argument is used. */
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
    const float unity = 1.0f;
    return unity;
}
!> Constant alternative: always returns 1.0; no argument is used.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
    implicit none
    real(4), intent (in) :: costheta_i, costheta_o
    real(4), intent (in) :: sintheta_i, sintheta_o
    real(4), intent (in) :: v
    real(4), parameter :: unity = 1.0e0

    code = unity
end function code
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    # Constant alternative: always Float32 one; no argument is used.
    unity = Float32(1.0)
    return unity
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Constant alternative: always returns single-precision one.
    % No argument is used.
    unity = single(1.0);
    tmp = unity;
end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.8%
associate-+l+ 99.8%
associate--l- 99.8%
associate-/l* 99.8%
associate-/l* 99.4%
associate-/r* 99.4%
metadata-eval 99.4%
Simplified 99.4%
Taylor expanded in sinTheta_i around inf 14.5%
associate-*r/ 14.5%
*-commutative 14.5%
neg-mul-1 14.5%
distribute-rgt-neg-in 14.5%
Simplified 14.5%
Taylor expanded in sinTheta_i around 0 6.3%
Final simplification 6.3%
herbie shell --seed 2024081
; Benchmark definition. The precondition bounds each of the four angle
; inputs to [-1, 1] and v to [-1.5707964, 0.1].
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :name "HairBSDF, Mp, lower"
  :precision binary32
  :pre (and (<= -1.0 cosTheta_i 1.0)
            (<= -1.0 cosTheta_O 1.0)
            (<= -1.0 sinTheta_i 1.0)
            (<= -1.0 sinTheta_O 1.0)
            (<= -1.5707964 v 0.1))
  (let* ((cos_term (/ (* cosTheta_i cosTheta_O) v))
         (sin_term (/ (* sinTheta_i sinTheta_O) v))
         ; Same association as the fully nested form.
         (shifted (+ (- (- cos_term sin_term) (/ 1.0 v)) 0.6931))
         (log_norm (log (/ 1.0 (* 2.0 v)))))
    (exp (+ shifted log_norm))))