
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (exp(-((sintheta_i * sintheta_o) / v)) * ((costheta_i * costheta_o) / v)) / ((sinh((1.0e0 / v)) * 2.0e0) * v)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(-Float32(Float32(sinTheta_i * sinTheta_O) / v))) * Float32(Float32(cosTheta_i * cosTheta_O) / v)) / Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinh((single(1.0) / v)) * single(2.0)) * v); end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 10 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (exp(-((sintheta_i * sintheta_o) / v)) * ((costheta_i * costheta_o) / v)) / ((sinh((1.0e0 / v)) * 2.0e0) * v)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(-Float32(Float32(sinTheta_i * sinTheta_O) / v))) * Float32(Float32(cosTheta_i * cosTheta_O) / v)) / Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinh((single(1.0) / v)) * single(2.0)) * v); end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
cosTheta_O_m = (fabs.f32 cosTheta_O)
cosTheta_O_s = (copysign.f32 1 cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
(pow (exp sinTheta_i) (/ sinTheta_O (- v)))
(/
(* cosTheta_O_m (* cosTheta_i (* (/ 1.0 v) (/ 1.0 v))))
(* (sinh (/ 1.0 v)) 2.0)))))cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (powf(expf(sinTheta_i), (sinTheta_O / -v)) * ((cosTheta_O_m * (cosTheta_i * ((1.0f / v) * (1.0f / v)))) / (sinhf((1.0f / v)) * 2.0f)));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * ((exp(sintheta_i) ** (sintheta_o / -v)) * ((costheta_o_m * (costheta_i * ((1.0e0 / v) * (1.0e0 / v)))) / (sinh((1.0e0 / v)) * 2.0e0)))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32((exp(sinTheta_i) ^ Float32(sinTheta_O / Float32(-v))) * Float32(Float32(cosTheta_O_m * Float32(cosTheta_i * Float32(Float32(Float32(1.0) / v) * Float32(Float32(1.0) / v)))) / Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * ((exp(sinTheta_i) ^ (sinTheta_O / -v)) * ((cosTheta_O_m * (cosTheta_i * ((single(1.0) / v) * (single(1.0) / v)))) / (sinh((single(1.0) / v)) * single(2.0))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left({\left(e^{sinTheta\_i}\right)}^{\left(\frac{sinTheta\_O}{-v}\right)} \cdot \frac{cosTheta\_O\_m \cdot \left(cosTheta\_i \cdot \left(\frac{1}{v} \cdot \frac{1}{v}\right)\right)}{\sinh \left(\frac{1}{v}\right) \cdot 2}\right)
\end{array}
Initial program 98.6%
times-frac98.5%
associate-*l/98.5%
associate-*r/98.5%
distribute-frac-neg298.5%
associate-/l*98.5%
exp-prod98.5%
*-commutative98.5%
associate-/l*98.6%
associate-/l*98.5%
Simplified98.5%
div-inv98.6%
*-un-lft-identity98.6%
times-frac98.6%
Applied egg-rr98.6%
div-inv98.8%
Applied egg-rr98.8%
Final simplification98.8%
cosTheta_O_m = (fabs.f32 cosTheta_O)
cosTheta_O_s = (copysign.f32 1 cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(/
(*
(exp (/ (* sinTheta_i sinTheta_O) (- v)))
(* (/ 1.0 v) (* cosTheta_O_m cosTheta_i)))
(* v (* (sinh (/ 1.0 v)) 2.0)))))cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * ((expf(((sinTheta_i * sinTheta_O) / -v)) * ((1.0f / v) * (cosTheta_O_m * cosTheta_i))) / (v * (sinhf((1.0f / v)) * 2.0f)));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * ((exp(((sintheta_i * sintheta_o) / -v)) * ((1.0e0 / v) * (costheta_o_m * costheta_i))) / (v * (sinh((1.0e0 / v)) * 2.0e0)))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) * Float32(Float32(Float32(1.0) / v) * Float32(cosTheta_O_m * cosTheta_i))) / Float32(v * Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * ((exp(((sinTheta_i * sinTheta_O) / -v)) * ((single(1.0) / v) * (cosTheta_O_m * cosTheta_i))) / (v * (sinh((single(1.0) / v)) * single(2.0))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}} \cdot \left(\frac{1}{v} \cdot \left(cosTheta\_O\_m \cdot cosTheta\_i\right)\right)}{v \cdot \left(\sinh \left(\frac{1}{v}\right) \cdot 2\right)}
\end{array}
Initial program 98.6%
div-inv98.7%
Applied egg-rr98.7%
Final simplification98.7%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* (/ (/ 1.0 v) (sinh (/ 1.0 v))) (/ (* cosTheta_i (/ cosTheta_O_m v)) 2.0))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (((1.0f / v) / sinhf((1.0f / v))) * ((cosTheta_i * (cosTheta_O_m / v)) / 2.0f));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (((1.0e0 / v) / sinh((1.0e0 / v))) * ((costheta_i * (costheta_o_m / v)) / 2.0e0))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(Float32(Float32(1.0) / v) / sinh(Float32(Float32(1.0) / v))) * Float32(Float32(cosTheta_i * Float32(cosTheta_O_m / v)) / Float32(2.0)))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (((single(1.0) / v) / sinh((single(1.0) / v))) * ((cosTheta_i * (cosTheta_O_m / v)) / single(2.0)));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(\frac{\frac{1}{v}}{\sinh \left(\frac{1}{v}\right)} \cdot \frac{cosTheta\_i \cdot \frac{cosTheta\_O\_m}{v}}{2}\right)
\end{array}
Initial program 98.6%
associate-*r/98.5%
associate-/l/98.5%
remove-double-neg98.5%
distribute-rgt-neg-out98.5%
distribute-rgt-neg-out98.5%
distribute-lft-neg-in98.5%
associate-*r/98.5%
associate-/l/98.5%
associate-*r/98.6%
Simplified98.5%
associate-*r*98.5%
times-frac98.3%
associate-*r/98.3%
add-sqr-sqrt-0.0%
sqrt-unprod98.2%
sqr-neg98.2%
sqrt-unprod98.2%
add-sqr-sqrt98.2%
associate-/l*98.2%
pow-exp98.2%
Applied egg-rr98.2%
Taylor expanded in sinTheta_i around 0 98.2%
metadata-eval98.2%
associate-*l/98.2%
associate-/r*98.4%
associate-/r/98.4%
rec-exp98.4%
sinh-def98.5%
Simplified98.5%
Final simplification98.5%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_O_m (/ cosTheta_i (fma v 2.0 (/ 0.3333333333333333 v))))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_O_m * (cosTheta_i / fmaf(v, 2.0f, (0.3333333333333333f / v))));
}
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_O_m * Float32(cosTheta_i / fma(v, Float32(2.0), Float32(Float32(0.3333333333333333) / v))))) end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_O\_m \cdot \frac{cosTheta\_i}{\mathsf{fma}\left(v, 2, \frac{0.3333333333333333}{v}\right)}\right)
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 63.3%
Taylor expanded in sinTheta_i around 0 63.3%
associate-/l*63.3%
associate-*r/63.3%
metadata-eval63.3%
*-commutative63.3%
fma-undefine63.3%
Simplified63.3%
Final simplification63.3%
cosTheta_O_m = (fabs.f32 cosTheta_O)
cosTheta_O_s = (copysign.f32 1 cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (* (/ 1.0 v) 0.3333333333333333)))
(*
cosTheta_O_s
(/
(* cosTheta_O_m cosTheta_i)
(+
t_0
(+ (* v 2.0) (/ (* sinTheta_O (* sinTheta_i (+ t_0 (* v 2.0)))) v)))))))cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (1.0f / v) * 0.3333333333333333f;
return cosTheta_O_s * ((cosTheta_O_m * cosTheta_i) / (t_0 + ((v * 2.0f) + ((sinTheta_O * (sinTheta_i * (t_0 + (v * 2.0f)))) / v))));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
t_0 = (1.0e0 / v) * 0.3333333333333333e0
code = costheta_o_s * ((costheta_o_m * costheta_i) / (t_0 + ((v * 2.0e0) + ((sintheta_o * (sintheta_i * (t_0 + (v * 2.0e0)))) / v))))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(Float32(1.0) / v) * Float32(0.3333333333333333)) return Float32(cosTheta_O_s * Float32(Float32(cosTheta_O_m * cosTheta_i) / Float32(t_0 + Float32(Float32(v * Float32(2.0)) + Float32(Float32(sinTheta_O * Float32(sinTheta_i * Float32(t_0 + Float32(v * Float32(2.0))))) / v))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
t_0 = (single(1.0) / v) * single(0.3333333333333333);
tmp = cosTheta_O_s * ((cosTheta_O_m * cosTheta_i) / (t_0 + ((v * single(2.0)) + ((sinTheta_O * (sinTheta_i * (t_0 + (v * single(2.0))))) / v))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
\begin{array}{l}
t_0 := \frac{1}{v} \cdot 0.3333333333333333\\
cosTheta\_O\_s \cdot \frac{cosTheta\_O\_m \cdot cosTheta\_i}{t\_0 + \left(v \cdot 2 + \frac{sinTheta\_O \cdot \left(sinTheta\_i \cdot \left(t\_0 + v \cdot 2\right)\right)}{v}\right)}
\end{array}
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 63.3%
Taylor expanded in sinTheta_i around 0 63.3%
Final simplification63.3%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (/ (* cosTheta_O_m cosTheta_i) (+ (* (/ 1.0 v) 0.3333333333333333) (* v 2.0)))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * ((cosTheta_O_m * cosTheta_i) / (((1.0f / v) * 0.3333333333333333f) + (v * 2.0f)));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * ((costheta_o_m * costheta_i) / (((1.0e0 / v) * 0.3333333333333333e0) + (v * 2.0e0)))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(cosTheta_O_m * cosTheta_i) / Float32(Float32(Float32(Float32(1.0) / v) * Float32(0.3333333333333333)) + Float32(v * Float32(2.0))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * ((cosTheta_O_m * cosTheta_i) / (((single(1.0) / v) * single(0.3333333333333333)) + (v * single(2.0))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \frac{cosTheta\_O\_m \cdot cosTheta\_i}{\frac{1}{v} \cdot 0.3333333333333333 + v \cdot 2}
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 63.3%
Taylor expanded in sinTheta_i around 0 63.3%
Final simplification63.3%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* 0.5 (/ 1.0 (/ v (* cosTheta_O_m cosTheta_i))))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (0.5f * (1.0f / (v / (cosTheta_O_m * cosTheta_i))));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (0.5e0 * (1.0e0 / (v / (costheta_o_m * costheta_i))))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(0.5) * Float32(Float32(1.0) / Float32(v / Float32(cosTheta_O_m * cosTheta_i))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (single(0.5) * (single(1.0) / (v / (cosTheta_O_m * cosTheta_i))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(0.5 \cdot \frac{1}{\frac{v}{cosTheta\_O\_m \cdot cosTheta\_i}}\right)
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 57.3%
distribute-lft-out57.3%
Simplified57.3%
Taylor expanded in v around inf 57.3%
associate-/l*57.3%
Simplified57.3%
Taylor expanded in cosTheta_O around 0 57.3%
*-commutative57.3%
associate-*r/57.3%
Simplified57.3%
associate-*r/57.3%
clear-num57.7%
Applied egg-rr57.7%
Final simplification57.7%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (/ 1.0 (/ 2.0 (* cosTheta_i (/ cosTheta_O_m v))))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (1.0f / (2.0f / (cosTheta_i * (cosTheta_O_m / v))));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (1.0e0 / (2.0e0 / (costheta_i * (costheta_o_m / v))))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(1.0) / Float32(Float32(2.0) / Float32(cosTheta_i * Float32(cosTheta_O_m / v))))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (single(1.0) / (single(2.0) / (cosTheta_i * (cosTheta_O_m / v))));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \frac{1}{\frac{2}{cosTheta\_i \cdot \frac{cosTheta\_O\_m}{v}}}
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 57.3%
distribute-lft-out57.3%
Simplified57.3%
Taylor expanded in v around inf 57.3%
associate-/l*57.3%
Simplified57.3%
Taylor expanded in cosTheta_O around 0 57.3%
*-commutative57.3%
associate-*r/57.3%
Simplified57.3%
*-commutative57.3%
metadata-eval57.3%
div-inv57.3%
clear-num57.8%
Applied egg-rr57.8%
Final simplification57.8%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* 0.5 (* cosTheta_O_m (/ cosTheta_i v)))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (0.5f * (cosTheta_O_m * (cosTheta_i / v)));
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (0.5e0 * (costheta_o_m * (costheta_i / v)))
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(0.5) * Float32(cosTheta_O_m * Float32(cosTheta_i / v)))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (single(0.5) * (cosTheta_O_m * (cosTheta_i / v)));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(0.5 \cdot \left(cosTheta\_O\_m \cdot \frac{cosTheta\_i}{v}\right)\right)
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 57.3%
distribute-lft-out57.3%
Simplified57.3%
Taylor expanded in v around inf 57.3%
associate-/l*57.3%
Simplified57.3%
Final simplification57.3%
cosTheta_O_m = (fabs.f32 cosTheta_O) cosTheta_O_s = (copysign.f32 1 cosTheta_O) NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* (* cosTheta_i (/ cosTheta_O_m v)) 0.5)))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * ((cosTheta_i * (cosTheta_O_m / v)) * 0.5f);
}
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0d0, cosTheta_O)
NOTE: cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * ((costheta_i * (costheta_o_m / v)) * 0.5e0)
end function
cosTheta_O_m = abs(cosTheta_O) cosTheta_O_s = copysign(1.0, cosTheta_O) cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(Float32(cosTheta_i * Float32(cosTheta_O_m / v)) * Float32(0.5))) end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(double(cosTheta_O)) * abs(1.0);
cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * ((cosTheta_i * (cosTheta_O_m / v)) * single(0.5));
end
\begin{array}{l}
cosTheta_O_m = \left|cosTheta\_O\right|
\\
cosTheta_O_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(\left(cosTheta\_i \cdot \frac{cosTheta\_O\_m}{v}\right) \cdot 0.5\right)
\end{array}
Initial program 98.6%
Simplified98.5%
Taylor expanded in v around inf 57.3%
distribute-lft-out57.3%
Simplified57.3%
Taylor expanded in v around inf 57.3%
associate-/l*57.3%
Simplified57.3%
Taylor expanded in cosTheta_O around 0 57.3%
*-commutative57.3%
associate-*r/57.3%
Simplified57.3%
Final simplification57.3%
herbie shell --seed 2024046
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, upper"
:precision binary32
:pre (and (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (< 0.1 v)) (<= v 1.5707964))
(/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))