
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta_i \cdot cosTheta_O}{v} - \frac{sinTheta_i \cdot sinTheta_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta_i \cdot cosTheta_O}{v} - \frac{sinTheta_i \cdot sinTheta_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (/ (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) v))
(t_1 (- 0.6931 (/ 1.0 v))))
(*
(/ 0.5 v)
(pow
(*
(*
(cbrt (exp (* 0.2222222222222222 (+ 0.6931 (+ (/ -1.0 v) t_0)))))
(pow
(pow
(cbrt
(exp
(+
(/ (fma cosTheta_O cosTheta_i (* sinTheta_O (- sinTheta_i))) v)
t_1)))
4.0)
0.1111111111111111))
(cbrt (cbrt (exp (+ t_1 t_0)))))
3.0))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = ((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v;
float t_1 = 0.6931f - (1.0f / v);
return (0.5f / v) * powf(((cbrtf(expf((0.2222222222222222f * (0.6931f + ((-1.0f / v) + t_0))))) * powf(powf(cbrtf(expf(((fmaf(cosTheta_O, cosTheta_i, (sinTheta_O * -sinTheta_i)) / v) + t_1))), 4.0f), 0.1111111111111111f)) * cbrtf(cbrtf(expf((t_1 + t_0))))), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) / v) t_1 = Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) return Float32(Float32(Float32(0.5) / v) * (Float32(Float32(cbrt(exp(Float32(Float32(0.2222222222222222) * Float32(Float32(0.6931) + Float32(Float32(Float32(-1.0) / v) + t_0))))) * ((cbrt(exp(Float32(Float32(fma(cosTheta_O, cosTheta_i, Float32(sinTheta_O * Float32(-sinTheta_i))) / v) + t_1))) ^ Float32(4.0)) ^ Float32(0.1111111111111111))) * cbrt(cbrt(exp(Float32(t_1 + t_0))))) ^ Float32(3.0))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta_O \cdot cosTheta_i - sinTheta_O \cdot sinTheta_i}{v}\\
t_1 := 0.6931 - \frac{1}{v}\\
\frac{0.5}{v} \cdot {\left(\left(\sqrt[3]{e^{0.2222222222222222 \cdot \left(0.6931 + \left(\frac{-1}{v} + t_0\right)\right)}} \cdot {\left({\left(\sqrt[3]{e^{\frac{\mathsf{fma}\left(cosTheta_O, cosTheta_i, sinTheta_O \cdot \left(-sinTheta_i\right)\right)}{v} + t_1}}\right)}^{4}\right)}^{0.1111111111111111}\right) \cdot \sqrt[3]{\sqrt[3]{e^{t_1 + t_0}}}\right)}^{3}
\end{array}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.6%
associate-/r*99.6%
metadata-eval99.6%
+-rgt-identity99.6%
metadata-eval99.6%
metadata-eval99.6%
+-rgt-identity99.6%
sub-neg99.6%
associate-+l+99.6%
Simplified99.6%
add-cube-cbrt99.6%
pow399.6%
associate-*l/99.6%
*-commutative99.6%
associate-/l*99.6%
sub-div99.6%
+-commutative99.6%
Applied egg-rr99.6%
pow1/399.6%
add-cube-cbrt99.6%
unpow-prod-down99.6%
pow299.6%
pow1/399.6%
Applied egg-rr99.6%
Applied egg-rr99.6%
Simplified99.6%
pow1/399.6%
pow1/399.6%
pow-pow99.6%
Applied egg-rr99.7%
Final simplification99.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (/ (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) v))
(t_1 (- 0.6931 (/ 1.0 v))))
(*
(/ 0.5 v)
(pow
(*
(cbrt (cbrt (exp (+ t_1 t_0))))
(*
(cbrt
(exp (* 0.2222222222222222 (- t_1 (* sinTheta_O (/ sinTheta_i v))))))
(cbrt (cbrt (pow (cbrt (exp (+ 0.6931 (+ (/ -1.0 v) t_0)))) 4.0)))))
3.0))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = ((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v;
float t_1 = 0.6931f - (1.0f / v);
return (0.5f / v) * powf((cbrtf(cbrtf(expf((t_1 + t_0)))) * (cbrtf(expf((0.2222222222222222f * (t_1 - (sinTheta_O * (sinTheta_i / v)))))) * cbrtf(cbrtf(powf(cbrtf(expf((0.6931f + ((-1.0f / v) + t_0)))), 4.0f))))), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) / v) t_1 = Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) return Float32(Float32(Float32(0.5) / v) * (Float32(cbrt(cbrt(exp(Float32(t_1 + t_0)))) * Float32(cbrt(exp(Float32(Float32(0.2222222222222222) * Float32(t_1 - Float32(sinTheta_O * Float32(sinTheta_i / v)))))) * cbrt(cbrt((cbrt(exp(Float32(Float32(0.6931) + Float32(Float32(Float32(-1.0) / v) + t_0)))) ^ Float32(4.0)))))) ^ Float32(3.0))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{cosTheta_O \cdot cosTheta_i - sinTheta_O \cdot sinTheta_i}{v}\\
t_1 := 0.6931 - \frac{1}{v}\\
\frac{0.5}{v} \cdot {\left(\sqrt[3]{\sqrt[3]{e^{t_1 + t_0}}} \cdot \left(\sqrt[3]{e^{0.2222222222222222 \cdot \left(t_1 - sinTheta_O \cdot \frac{sinTheta_i}{v}\right)}} \cdot \sqrt[3]{\sqrt[3]{{\left(\sqrt[3]{e^{0.6931 + \left(\frac{-1}{v} + t_0\right)}}\right)}^{4}}}\right)\right)}^{3}
\end{array}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.6%
associate-/r*99.6%
metadata-eval99.6%
+-rgt-identity99.6%
metadata-eval99.6%
metadata-eval99.6%
+-rgt-identity99.6%
sub-neg99.6%
associate-+l+99.6%
Simplified99.6%
add-cube-cbrt99.6%
pow399.6%
associate-*l/99.6%
*-commutative99.6%
associate-/l*99.6%
sub-div99.6%
+-commutative99.6%
Applied egg-rr99.6%
pow1/399.6%
add-cube-cbrt99.6%
unpow-prod-down99.6%
pow299.6%
pow1/399.6%
Applied egg-rr99.6%
Applied egg-rr99.6%
Simplified99.6%
Taylor expanded in cosTheta_O around 0 99.6%
*-commutative99.6%
associate--r+99.6%
*-commutative99.6%
associate-*l/99.6%
*-commutative99.6%
Simplified99.6%
Final simplification99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0
(cbrt
(exp
(+
(- 0.6931 (/ 1.0 v))
(/ (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) v))))))
(*
(/ 0.5 v)
(pow (* (cbrt t_0) (pow (pow t_0 2.0) 0.3333333333333333)) 3.0))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = cbrtf(expf(((0.6931f - (1.0f / v)) + (((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v))));
return (0.5f / v) * powf((cbrtf(t_0) * powf(powf(t_0, 2.0f), 0.3333333333333333f)), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = cbrt(exp(Float32(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) + Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) / v)))) return Float32(Float32(Float32(0.5) / v) * (Float32(cbrt(t_0) * ((t_0 ^ Float32(2.0)) ^ Float32(0.3333333333333333))) ^ Float32(3.0))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \sqrt[3]{e^{\left(0.6931 - \frac{1}{v}\right) + \frac{cosTheta_O \cdot cosTheta_i - sinTheta_O \cdot sinTheta_i}{v}}}\\
\frac{0.5}{v} \cdot {\left(\sqrt[3]{t_0} \cdot {\left({t_0}^{2}\right)}^{0.3333333333333333}\right)}^{3}
\end{array}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.6%
associate-/r*99.6%
metadata-eval99.6%
+-rgt-identity99.6%
metadata-eval99.6%
metadata-eval99.6%
+-rgt-identity99.6%
sub-neg99.6%
associate-+l+99.6%
Simplified99.6%
add-cube-cbrt99.6%
pow399.6%
associate-*l/99.6%
*-commutative99.6%
associate-/l*99.6%
sub-div99.6%
+-commutative99.6%
Applied egg-rr99.6%
pow1/399.6%
add-cube-cbrt99.6%
unpow-prod-down99.6%
pow299.6%
pow1/399.6%
Applied egg-rr99.6%
Final simplification99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(*
(/ 0.5 v)
(pow
(cbrt
(exp
(+
(- 0.6931 (/ 1.0 v))
(/ (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) v))))
3.0)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * powf(cbrtf(expf(((0.6931f - (1.0f / v)) + (((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v)))), 3.0f);
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * (cbrt(exp(Float32(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) + Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) / v)))) ^ Float32(3.0))) end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot {\left(\sqrt[3]{e^{\left(0.6931 - \frac{1}{v}\right) + \frac{cosTheta_O \cdot cosTheta_i - sinTheta_O \cdot sinTheta_i}{v}}}\right)}^{3}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.6%
associate-/r*99.6%
metadata-eval99.6%
+-rgt-identity99.6%
metadata-eval99.6%
metadata-eval99.6%
+-rgt-identity99.6%
sub-neg99.6%
associate-+l+99.6%
Simplified99.6%
add-cube-cbrt99.6%
pow399.6%
associate-*l/99.6%
*-commutative99.6%
associate-/l*99.6%
sub-div99.6%
+-commutative99.6%
Applied egg-rr99.6%
Final simplification99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(*
(/ 0.5 v)
(pow
E
(+
(- 0.6931 (/ 1.0 v))
(/ (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * powf(((float) M_E), ((0.6931f - (1.0f / v)) + (((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v)));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * (Float32(exp(1)) ^ Float32(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) + Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * (single(2.71828182845904523536) ^ ((single(0.6931) - (single(1.0) / v)) + (((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot {e}^{\left(\left(0.6931 - \frac{1}{v}\right) + \frac{cosTheta_O \cdot cosTheta_i - sinTheta_O \cdot sinTheta_i}{v}\right)}
\end{array}
Initial program 99.6%
exp-sum99.6%
*-commutative99.6%
rem-exp-log99.6%
associate-/r*99.6%
metadata-eval99.6%
+-rgt-identity99.6%
metadata-eval99.6%
metadata-eval99.6%
+-rgt-identity99.6%
sub-neg99.6%
associate-+l+99.6%
Simplified99.6%
*-un-lft-identity99.6%
exp-prod99.6%
associate-*l/99.6%
*-commutative99.6%
associate-/l*99.6%
sub-div99.6%
+-commutative99.6%
Applied egg-rr99.6%
Final simplification99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (- 0.6931 (/ 1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f - (1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp((0.6931e0 - (1.0e0 / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(0.6931) - (single(1.0) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 - \frac{1}{v}}
\end{array}
Initial program 99.6%
Taylor expanded in sinTheta_i around 0 99.6%
*-un-lft-identity99.6%
exp-prod99.6%
+-commutative99.6%
associate-/l*99.6%
Applied egg-rr99.6%
Taylor expanded in cosTheta_O around 0 99.6%
sub-neg99.6%
exp-sum99.2%
prod-exp99.2%
rem-exp-log99.2%
*-commutative99.2%
associate-*l*99.6%
distribute-neg-frac99.6%
metadata-eval99.6%
exp-sum99.6%
Simplified99.6%
Final simplification99.6%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ -1.0 v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((-1.0f / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((-1.0e0) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(-1.0) / v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(-1.0) / v)); end
\begin{array}{l}
\\
e^{\frac{-1}{v}}
\end{array}
Initial program 99.6%
Taylor expanded in sinTheta_i around 0 99.6%
Taylor expanded in cosTheta_O around 0 99.6%
Taylor expanded in v around 0 97.2%
Final simplification97.2%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 1.0)
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 1.0f;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = 1.0e0
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(1.0) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(1.0); end
\begin{array}{l}
\\
1
\end{array}
Initial program 99.6%
Taylor expanded in v around 0 97.2%
Taylor expanded in v around inf 6.4%
Final simplification6.4%
herbie shell --seed 2024021
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))