
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (exp(-((sintheta_i * sintheta_o) / v)) * ((costheta_i * costheta_o) / v)) / ((sinh((1.0e0 / v)) * 2.0e0) * v)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(-Float32(Float32(sinTheta_i * sinTheta_O) / v))) * Float32(Float32(cosTheta_i * cosTheta_O) / v)) / Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinh((single(1.0) / v)) * single(2.0)) * v); end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 21 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (exp(-((sintheta_i * sintheta_o) / v)) * ((costheta_i * costheta_o) / v)) / ((sinh((1.0e0 / v)) * 2.0e0) * v)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(-Float32(Float32(sinTheta_i * sinTheta_O) / v))) * Float32(Float32(cosTheta_i * cosTheta_O) / v)) / Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinh((single(1.0) / v)) * single(2.0)) * v); end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(*
(/ 1.0 v)
(* (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v) cosTheta_O_m))
(/ (* cosTheta_i_m 0.5) (sinh (/ 1.0 v)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((1.0f / v) * ((expf(((sinTheta_i * sinTheta_O) / -v)) / v) * cosTheta_O_m)) * ((cosTheta_i_m * 0.5f) / sinhf((1.0f / v)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((1.0e0 / v) * ((exp(((sintheta_i * sintheta_o) / -v)) / v) * costheta_o_m)) * ((costheta_i_m * 0.5e0) / sinh((1.0e0 / v)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(Float32(1.0) / v) * Float32(Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v) * cosTheta_O_m)) * Float32(Float32(cosTheta_i_m * Float32(0.5)) / sinh(Float32(Float32(1.0) / v)))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((single(1.0) / v) * ((exp(((sinTheta_i * sinTheta_O) / -v)) / v) * cosTheta_O_m)) * ((cosTheta_i_m * single(0.5)) / sinh((single(1.0) / v)))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\left(\frac{1}{v} \cdot \left(\frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v} \cdot cosTheta\_O\_m\right)\right) \cdot \frac{cosTheta\_i\_m \cdot 0.5}{\sinh \left(\frac{1}{v}\right)}\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
*-commutativeN/A
div-invN/A
associate-*l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f3299.1
Applied egg-rr99.1%
*-commutativeN/A
associate-*l*N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f3298.9
Applied egg-rr98.9%
Final simplification98.9%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(/ (* cosTheta_i_m 0.5) (sinh (/ 1.0 v)))
(*
cosTheta_O_m
(* (/ 1.0 v) (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * 0.5f) / sinhf((1.0f / v))) * (cosTheta_O_m * ((1.0f / v) * (expf(((sinTheta_i * sinTheta_O) / -v)) / v)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((costheta_i_m * 0.5e0) / sinh((1.0e0 / v))) * (costheta_o_m * ((1.0e0 / v) * (exp(((sintheta_i * sintheta_o) / -v)) / v)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(cosTheta_i_m * Float32(0.5)) / sinh(Float32(Float32(1.0) / v))) * Float32(cosTheta_O_m * Float32(Float32(Float32(1.0) / v) * Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v)))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * single(0.5)) / sinh((single(1.0) / v))) * (cosTheta_O_m * ((single(1.0) / v) * (exp(((sinTheta_i * sinTheta_O) / -v)) / v)))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\frac{cosTheta\_i\_m \cdot 0.5}{\sinh \left(\frac{1}{v}\right)} \cdot \left(cosTheta\_O\_m \cdot \left(\frac{1}{v} \cdot \frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v}\right)\right)\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
*-commutativeN/A
div-invN/A
associate-*l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f3299.1
Applied egg-rr99.1%
Final simplification99.1%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(/ (* cosTheta_i_m 0.5) (sinh (/ 1.0 v)))
(* (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v) (/ cosTheta_O_m v))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * 0.5f) / sinhf((1.0f / v))) * ((expf(((sinTheta_i * sinTheta_O) / -v)) / v) * (cosTheta_O_m / v))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((costheta_i_m * 0.5e0) / sinh((1.0e0 / v))) * ((exp(((sintheta_i * sintheta_o) / -v)) / v) * (costheta_o_m / v))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(cosTheta_i_m * Float32(0.5)) / sinh(Float32(Float32(1.0) / v))) * Float32(Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v) * Float32(cosTheta_O_m / v))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * single(0.5)) / sinh((single(1.0) / v))) * ((exp(((sinTheta_i * sinTheta_O) / -v)) / v) * (cosTheta_O_m / v))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\frac{cosTheta\_i\_m \cdot 0.5}{\sinh \left(\frac{1}{v}\right)} \cdot \left(\frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v} \cdot \frac{cosTheta\_O\_m}{v}\right)\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
Final simplification98.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(* (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v) cosTheta_O_m)
(/ cosTheta_i_m (* (sinh (/ 1.0 v)) (* v 2.0)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((expf(((sinTheta_i * sinTheta_O) / -v)) / v) * cosTheta_O_m) * (cosTheta_i_m / (sinhf((1.0f / v)) * (v * 2.0f)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((exp(((sintheta_i * sintheta_o) / -v)) / v) * costheta_o_m) * (costheta_i_m / (sinh((1.0e0 / v)) * (v * 2.0e0)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v) * cosTheta_O_m) * Float32(cosTheta_i_m / Float32(sinh(Float32(Float32(1.0) / v)) * Float32(v * Float32(2.0))))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((exp(((sinTheta_i * sinTheta_O) / -v)) / v) * cosTheta_O_m) * (cosTheta_i_m / (sinh((single(1.0) / v)) * (v * single(2.0))))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\left(\frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v} \cdot cosTheta\_O\_m\right) \cdot \frac{cosTheta\_i\_m}{\sinh \left(\frac{1}{v}\right) \cdot \left(v \cdot 2\right)}\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
Final simplification98.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
cosTheta_i_m
(*
(/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v)
(/ cosTheta_O_m (* (sinh (/ 1.0 v)) (* v 2.0))))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_i_m * ((expf(((sinTheta_i * sinTheta_O) / -v)) / v) * (cosTheta_O_m / (sinhf((1.0f / v)) * (v * 2.0f))))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (costheta_i_m * ((exp(((sintheta_i * sintheta_o) / -v)) / v) * (costheta_o_m / (sinh((1.0e0 / v)) * (v * 2.0e0))))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_i_m * Float32(Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v) * Float32(cosTheta_O_m / Float32(sinh(Float32(Float32(1.0) / v)) * Float32(v * Float32(2.0)))))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (cosTheta_i_m * ((exp(((sinTheta_i * sinTheta_O) / -v)) / v) * (cosTheta_O_m / (sinh((single(1.0) / v)) * (v * single(2.0)))))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_i\_m \cdot \left(\frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v} \cdot \frac{cosTheta\_O\_m}{\sinh \left(\frac{1}{v}\right) \cdot \left(v \cdot 2\right)}\right)\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
Applied egg-rr98.8%
Final simplification98.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(* cosTheta_O_m (fma sinTheta_O (/ sinTheta_i (- v)) 1.0))
(/ cosTheta_i_m (* (sinh (/ 1.0 v)) (* v (* v 2.0))))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * fmaf(sinTheta_O, (sinTheta_i / -v), 1.0f)) * (cosTheta_i_m / (sinhf((1.0f / v)) * (v * (v * 2.0f))))));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_O_m * fma(sinTheta_O, Float32(sinTheta_i / Float32(-v)), Float32(1.0))) * Float32(cosTheta_i_m / Float32(sinh(Float32(Float32(1.0) / v)) * Float32(v * Float32(v * Float32(2.0)))))))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\left(cosTheta\_O\_m \cdot \mathsf{fma}\left(sinTheta\_O, \frac{sinTheta\_i}{-v}, 1\right)\right) \cdot \frac{cosTheta\_i\_m}{\sinh \left(\frac{1}{v}\right) \cdot \left(v \cdot \left(v \cdot 2\right)\right)}\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
Taylor expanded in sinTheta_i around 0
+-commutativeN/A
mul-1-negN/A
associate-/l*N/A
distribute-rgt-neg-inN/A
mul-1-negN/A
accelerator-lowering-fma.f32N/A
mul-1-negN/A
distribute-neg-frac2N/A
mul-1-negN/A
/-lowering-/.f32N/A
mul-1-negN/A
neg-lowering-neg.f3298.8
Simplified98.8%
Final simplification98.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(/ (* cosTheta_i_m 0.5) (sinh (/ 1.0 v)))
(* cosTheta_O_m (* (/ 1.0 v) (/ 1.0 v)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * 0.5f) / sinhf((1.0f / v))) * (cosTheta_O_m * ((1.0f / v) * (1.0f / v)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((costheta_i_m * 0.5e0) / sinh((1.0e0 / v))) * (costheta_o_m * ((1.0e0 / v) * (1.0e0 / v)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(cosTheta_i_m * Float32(0.5)) / sinh(Float32(Float32(1.0) / v))) * Float32(cosTheta_O_m * Float32(Float32(Float32(1.0) / v) * Float32(Float32(1.0) / v)))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * single(0.5)) / sinh((single(1.0) / v))) * (cosTheta_O_m * ((single(1.0) / v) * (single(1.0) / v)))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\frac{cosTheta\_i\_m \cdot 0.5}{\sinh \left(\frac{1}{v}\right)} \cdot \left(cosTheta\_O\_m \cdot \left(\frac{1}{v} \cdot \frac{1}{v}\right)\right)\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
*-commutativeN/A
div-invN/A
associate-*l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
exp-lowering-exp.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f3299.1
Applied egg-rr99.1%
Taylor expanded in sinTheta_i around 0
Simplified98.9%
Final simplification98.9%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(/ (* cosTheta_i_m 0.5) (sinh (/ 1.0 v)))
(* (/ 1.0 v) (/ cosTheta_O_m v))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * 0.5f) / sinhf((1.0f / v))) * ((1.0f / v) * (cosTheta_O_m / v))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (((costheta_i_m * 0.5e0) / sinh((1.0e0 / v))) * ((1.0e0 / v) * (costheta_o_m / v))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(Float32(cosTheta_i_m * Float32(0.5)) / sinh(Float32(Float32(1.0) / v))) * Float32(Float32(Float32(1.0) / v) * Float32(cosTheta_O_m / v))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (((cosTheta_i_m * single(0.5)) / sinh((single(1.0) / v))) * ((single(1.0) / v) * (cosTheta_O_m / v))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\frac{cosTheta\_i\_m \cdot 0.5}{\sinh \left(\frac{1}{v}\right)} \cdot \left(\frac{1}{v} \cdot \frac{cosTheta\_O\_m}{v}\right)\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
associate-*r/N/A
associate-*r*N/A
associate-/r*N/A
Applied egg-rr98.8%
Taylor expanded in sinTheta_i around 0
/-lowering-/.f3298.6
Simplified98.6%
Final simplification98.6%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (* cosTheta_O_m (/ cosTheta_i_m (* (sinh (/ 1.0 v)) (* v (* v 2.0))))))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_O_m * (cosTheta_i_m / (sinhf((1.0f / v)) * (v * (v * 2.0f))))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (costheta_o_m * (costheta_i_m / (sinh((1.0e0 / v)) * (v * (v * 2.0e0))))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_O_m * Float32(cosTheta_i_m / Float32(sinh(Float32(Float32(1.0) / v)) * Float32(v * Float32(v * Float32(2.0)))))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (cosTheta_O_m * (cosTheta_i_m / (sinh((single(1.0) / v)) * (v * (v * single(2.0)))))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_O\_m \cdot \frac{cosTheta\_i\_m}{\sinh \left(\frac{1}{v}\right) \cdot \left(v \cdot \left(v \cdot 2\right)\right)}\right)\right)
\end{array}
Initial program 98.6%
associate-*r/N/A
associate-/l/N/A
*-commutativeN/A
associate-*r*N/A
associate-/l*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
exp-lowering-exp.f32N/A
distribute-neg-frac2N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
neg-lowering-neg.f32N/A
/-lowering-/.f32N/A
Applied egg-rr98.8%
Taylor expanded in sinTheta_i around 0
Simplified98.6%
Final simplification98.6%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(/
(*
cosTheta_O_m
(/
cosTheta_i_m
(fma
2.0
(fma
sinTheta_i
(/ sinTheta_O v)
(/
(fma
sinTheta_O
(* sinTheta_O (* 0.5 (* sinTheta_i sinTheta_i)))
0.16666666666666666)
(* v v)))
2.0)))
v))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * (cosTheta_i_m / fmaf(2.0f, fmaf(sinTheta_i, (sinTheta_O / v), (fmaf(sinTheta_O, (sinTheta_O * (0.5f * (sinTheta_i * sinTheta_i))), 0.16666666666666666f) / (v * v))), 2.0f))) / v));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_O_m * Float32(cosTheta_i_m / fma(Float32(2.0), fma(sinTheta_i, Float32(sinTheta_O / v), Float32(fma(sinTheta_O, Float32(sinTheta_O * Float32(Float32(0.5) * Float32(sinTheta_i * sinTheta_i))), Float32(0.16666666666666666)) / Float32(v * v))), Float32(2.0)))) / v))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \frac{cosTheta\_O\_m \cdot \frac{cosTheta\_i\_m}{\mathsf{fma}\left(2, \mathsf{fma}\left(sinTheta\_i, \frac{sinTheta\_O}{v}, \frac{\mathsf{fma}\left(sinTheta\_O, sinTheta\_O \cdot \left(0.5 \cdot \left(sinTheta\_i \cdot sinTheta\_i\right)\right), 0.16666666666666666\right)}{v \cdot v}\right), 2\right)}}{v}\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
times-fracN/A
associate-*r/N/A
/-lowering-/.f32N/A
Applied egg-rr64.2%
Final simplification64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(/
(* cosTheta_i_m (/ cosTheta_O_m v))
(fma
2.0
(fma
sinTheta_O
(/ sinTheta_i v)
(/
(fma
(* sinTheta_O (* sinTheta_O 0.5))
(* sinTheta_i sinTheta_i)
0.16666666666666666)
(* v v)))
2.0)))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_i_m * (cosTheta_O_m / v)) / fmaf(2.0f, fmaf(sinTheta_O, (sinTheta_i / v), (fmaf((sinTheta_O * (sinTheta_O * 0.5f)), (sinTheta_i * sinTheta_i), 0.16666666666666666f) / (v * v))), 2.0f)));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_i_m * Float32(cosTheta_O_m / v)) / fma(Float32(2.0), fma(sinTheta_O, Float32(sinTheta_i / v), Float32(fma(Float32(sinTheta_O * Float32(sinTheta_O * Float32(0.5))), Float32(sinTheta_i * sinTheta_i), Float32(0.16666666666666666)) / Float32(v * v))), Float32(2.0))))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \frac{cosTheta\_i\_m \cdot \frac{cosTheta\_O\_m}{v}}{\mathsf{fma}\left(2, \mathsf{fma}\left(sinTheta\_O, \frac{sinTheta\_i}{v}, \frac{\mathsf{fma}\left(sinTheta\_O \cdot \left(sinTheta\_O \cdot 0.5\right), sinTheta\_i \cdot sinTheta\_i, 0.16666666666666666\right)}{v \cdot v}\right), 2\right)}\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
div-invN/A
*-lowering-*.f32N/A
associate-*l*N/A
accelerator-lowering-fma.f32N/A
*-lowering-*.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f3264.2
Applied egg-rr64.2%
times-fracN/A
associate-*l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
Applied egg-rr64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
(/ cosTheta_O_m v)
(/
cosTheta_i_m
(fma
2.0
(fma
sinTheta_i
(/ sinTheta_O v)
(/
(fma
sinTheta_O
(* sinTheta_O (* 0.5 (* sinTheta_i sinTheta_i)))
0.16666666666666666)
(* v v)))
2.0))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m / v) * (cosTheta_i_m / fmaf(2.0f, fmaf(sinTheta_i, (sinTheta_O / v), (fmaf(sinTheta_O, (sinTheta_O * (0.5f * (sinTheta_i * sinTheta_i))), 0.16666666666666666f) / (v * v))), 2.0f))));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_O_m / v) * Float32(cosTheta_i_m / fma(Float32(2.0), fma(sinTheta_i, Float32(sinTheta_O / v), Float32(fma(sinTheta_O, Float32(sinTheta_O * Float32(Float32(0.5) * Float32(sinTheta_i * sinTheta_i))), Float32(0.16666666666666666)) / Float32(v * v))), Float32(2.0)))))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\frac{cosTheta\_O\_m}{v} \cdot \frac{cosTheta\_i\_m}{\mathsf{fma}\left(2, \mathsf{fma}\left(sinTheta\_i, \frac{sinTheta\_O}{v}, \frac{\mathsf{fma}\left(sinTheta\_O, sinTheta\_O \cdot \left(0.5 \cdot \left(sinTheta\_i \cdot sinTheta\_i\right)\right), 0.16666666666666666\right)}{v \cdot v}\right), 2\right)}\right)\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
times-fracN/A
*-lowering-*.f32N/A
Applied egg-rr64.2%
Final simplification64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
cosTheta_i_m
(/
cosTheta_O_m
(*
v
(fma
2.0
(fma
sinTheta_i
(/ sinTheta_O v)
(/
(fma
sinTheta_O
(* sinTheta_O (* 0.5 (* sinTheta_i sinTheta_i)))
0.16666666666666666)
(* v v)))
2.0)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_i_m * (cosTheta_O_m / (v * fmaf(2.0f, fmaf(sinTheta_i, (sinTheta_O / v), (fmaf(sinTheta_O, (sinTheta_O * (0.5f * (sinTheta_i * sinTheta_i))), 0.16666666666666666f) / (v * v))), 2.0f)))));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_i_m * Float32(cosTheta_O_m / Float32(v * fma(Float32(2.0), fma(sinTheta_i, Float32(sinTheta_O / v), Float32(fma(sinTheta_O, Float32(sinTheta_O * Float32(Float32(0.5) * Float32(sinTheta_i * sinTheta_i))), Float32(0.16666666666666666)) / Float32(v * v))), Float32(2.0))))))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_i\_m \cdot \frac{cosTheta\_O\_m}{v \cdot \mathsf{fma}\left(2, \mathsf{fma}\left(sinTheta\_i, \frac{sinTheta\_O}{v}, \frac{\mathsf{fma}\left(sinTheta\_O, sinTheta\_O \cdot \left(0.5 \cdot \left(sinTheta\_i \cdot sinTheta\_i\right)\right), 0.16666666666666666\right)}{v \cdot v}\right), 2\right)}\right)\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
associate-/l*N/A
*-commutativeN/A
*-lowering-*.f32N/A
Applied egg-rr64.2%
Final simplification64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(*
cosTheta_O_m
(/
cosTheta_i_m
(*
v
(fma
2.0
(fma
sinTheta_i
(/ sinTheta_O v)
(/
(fma
sinTheta_O
(* sinTheta_O (* 0.5 (* sinTheta_i sinTheta_i)))
0.16666666666666666)
(* v v)))
2.0)))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_O_m * (cosTheta_i_m / (v * fmaf(2.0f, fmaf(sinTheta_i, (sinTheta_O / v), (fmaf(sinTheta_O, (sinTheta_O * (0.5f * (sinTheta_i * sinTheta_i))), 0.16666666666666666f) / (v * v))), 2.0f)))));
}
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_O_m * Float32(cosTheta_i_m / Float32(v * fma(Float32(2.0), fma(sinTheta_i, Float32(sinTheta_O / v), Float32(fma(sinTheta_O, Float32(sinTheta_O * Float32(Float32(0.5) * Float32(sinTheta_i * sinTheta_i))), Float32(0.16666666666666666)) / Float32(v * v))), Float32(2.0))))))) end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_O\_m \cdot \frac{cosTheta\_i\_m}{v \cdot \mathsf{fma}\left(2, \mathsf{fma}\left(sinTheta\_i, \frac{sinTheta\_O}{v}, \frac{\mathsf{fma}\left(sinTheta\_O, sinTheta\_O \cdot \left(0.5 \cdot \left(sinTheta\_i \cdot sinTheta\_i\right)\right), 0.16666666666666666\right)}{v \cdot v}\right), 2\right)}\right)\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
*-commutativeN/A
associate-/l*N/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
accelerator-lowering-fma.f32N/A
Applied egg-rr64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i)
cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
cosTheta_O\_m = (fabs.f32 cosTheta_O)
cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
(FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
:precision binary32
(*
cosTheta_O_s
(*
cosTheta_i_s
(/
(* cosTheta_O_m cosTheta_i_m)
(* v (+ 2.0 (/ 0.3333333333333333 (* v v))))))))cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * cosTheta_i_m) / (v * (2.0f + (0.3333333333333333f / (v * v))))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * ((costheta_o_m * costheta_i_m) / (v * (2.0e0 + (0.3333333333333333e0 / (v * v))))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_O_m * cosTheta_i_m) / Float32(v * Float32(Float32(2.0) + Float32(Float32(0.3333333333333333) / Float32(v * v))))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * cosTheta_i_m) / (v * (single(2.0) + (single(0.3333333333333333) / (v * v))))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \frac{cosTheta\_O\_m \cdot cosTheta\_i\_m}{v \cdot \left(2 + \frac{0.3333333333333333}{v \cdot v}\right)}\right)
\end{array}
Initial program 98.6%
*-commutativeN/A
exp-negN/A
un-div-invN/A
associate-/r*N/A
associate-/l/N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
Applied egg-rr98.6%
Taylor expanded in v around inf
+-commutativeN/A
distribute-lft-outN/A
accelerator-lowering-fma.f32N/A
Simplified64.2%
Taylor expanded in sinTheta_O around 0
+-lowering-+.f32N/A
associate-*r/N/A
metadata-evalN/A
/-lowering-/.f32N/A
unpow2N/A
*-lowering-*.f3264.2
Simplified64.2%
Final simplification64.2%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (/ 1.0 (/ v (* cosTheta_i_m (* cosTheta_O_m 0.5)))))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (1.0f / (v / (cosTheta_i_m * (cosTheta_O_m * 0.5f)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (1.0e0 / (v / (costheta_i_m * (costheta_o_m * 0.5e0)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(1.0) / Float32(v / Float32(cosTheta_i_m * Float32(cosTheta_O_m * Float32(0.5))))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (single(1.0) / (v / (cosTheta_i_m * (cosTheta_O_m * single(0.5))))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \frac{1}{\frac{v}{cosTheta\_i\_m \cdot \left(cosTheta\_O\_m \cdot 0.5\right)}}\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
associate-/l*N/A
*-commutativeN/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f3258.8
Applied egg-rr58.8%
associate-*l/N/A
associate-*l/N/A
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
*-lowering-*.f32N/A
*-commutativeN/A
*-lowering-*.f3259.3
Applied egg-rr59.3%
Final simplification59.3%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (/ 1.0 (/ v (* 0.5 (* cosTheta_O_m cosTheta_i_m)))))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (1.0f / (v / (0.5f * (cosTheta_O_m * cosTheta_i_m)))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (1.0e0 / (v / (0.5e0 * (costheta_o_m * costheta_i_m)))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(1.0) / Float32(v / Float32(Float32(0.5) * Float32(cosTheta_O_m * cosTheta_i_m)))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (single(1.0) / (v / (single(0.5) * (cosTheta_O_m * cosTheta_i_m)))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \frac{1}{\frac{v}{0.5 \cdot \left(cosTheta\_O\_m \cdot cosTheta\_i\_m\right)}}\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
clear-numN/A
/-lowering-/.f32N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-commutativeN/A
*-lowering-*.f32N/A
*-commutativeN/A
*-lowering-*.f3259.3
Applied egg-rr59.3%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (* 0.5 (/ (* cosTheta_O_m cosTheta_i_m) v)))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (0.5f * ((cosTheta_O_m * cosTheta_i_m) / v)));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (0.5e0 * ((costheta_o_m * costheta_i_m) / v)))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(0.5) * Float32(Float32(cosTheta_O_m * cosTheta_i_m) / v)))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (single(0.5) * ((cosTheta_O_m * cosTheta_i_m) / v)));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(0.5 \cdot \frac{cosTheta\_O\_m \cdot cosTheta\_i\_m}{v}\right)\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
clear-numN/A
*-commutativeN/A
associate-/r*N/A
associate-/r/N/A
clear-numN/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f3258.8
Applied egg-rr58.8%
Final simplification58.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (* (* cosTheta_O_m cosTheta_i_m) (/ 0.5 v)))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * cosTheta_i_m) * (0.5f / v)));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * ((costheta_o_m * costheta_i_m) * (0.5e0 / v)))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(Float32(cosTheta_O_m * cosTheta_i_m) * Float32(Float32(0.5) / v)))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * ((cosTheta_O_m * cosTheta_i_m) * (single(0.5) / v)));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(\left(cosTheta\_O\_m \cdot cosTheta\_i\_m\right) \cdot \frac{0.5}{v}\right)\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
associate-/l*N/A
*-commutativeN/A
*-commutativeN/A
*-lowering-*.f32N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f3258.8
Applied egg-rr58.8%
Final simplification58.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (* cosTheta_O_m (* cosTheta_i_m (/ 0.5 v))))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_O_m * (cosTheta_i_m * (0.5f / v))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (costheta_o_m * (costheta_i_m * (0.5e0 / v))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_O_m * Float32(cosTheta_i_m * Float32(Float32(0.5) / v))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (cosTheta_O_m * (cosTheta_i_m * (single(0.5) / v))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_O\_m \cdot \left(cosTheta\_i\_m \cdot \frac{0.5}{v}\right)\right)\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
associate-/l*N/A
*-commutativeN/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f3258.8
Applied egg-rr58.8%
associate-*l*N/A
*-commutativeN/A
associate-*r*N/A
*-lowering-*.f32N/A
metadata-evalN/A
associate-/r*N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-commutativeN/A
associate-/r*N/A
metadata-evalN/A
/-lowering-/.f3258.8
Applied egg-rr58.8%
Final simplification58.8%
cosTheta_i\_m = (fabs.f32 cosTheta_i) cosTheta_i\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i) cosTheta_O\_m = (fabs.f32 cosTheta_O) cosTheta_O\_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O) NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function. (FPCore (cosTheta_O_s cosTheta_i_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v) :precision binary32 (* cosTheta_O_s (* cosTheta_i_s (* cosTheta_i_m (* cosTheta_O_m (/ 0.5 v))))))
cosTheta_i\_m = fabs(cosTheta_i);
cosTheta_i\_s = copysign(1.0, cosTheta_i);
cosTheta_O\_m = fabs(cosTheta_O);
cosTheta_O\_s = copysign(1.0, cosTheta_O);
assert(cosTheta_i_m < cosTheta_O_m && cosTheta_O_m < sinTheta_i && sinTheta_i < sinTheta_O && sinTheta_O < v);
float code(float cosTheta_O_s, float cosTheta_i_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_O_s * (cosTheta_i_s * (cosTheta_i_m * (cosTheta_O_m * (0.5f / v))));
}
cosTheta_i\_m = abs(costheta_i)
cosTheta_i\_s = copysign(1.0d0, costheta_i)
cosTheta_O\_m = abs(costheta_o)
cosTheta_O\_s = copysign(1.0d0, costheta_o)
NOTE: cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, and v should be sorted in increasing order before calling this function.
real(4) function code(costheta_o_s, costheta_i_s, costheta_i_m, costheta_o_m, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_o_s
real(4), intent (in) :: costheta_i_s
real(4), intent (in) :: costheta_i_m
real(4), intent (in) :: costheta_o_m
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = costheta_o_s * (costheta_i_s * (costheta_i_m * (costheta_o_m * (0.5e0 / v))))
end function
cosTheta_i\_m = abs(cosTheta_i) cosTheta_i\_s = copysign(1.0, cosTheta_i) cosTheta_O\_m = abs(cosTheta_O) cosTheta_O\_s = copysign(1.0, cosTheta_O) cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v]) function code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v) return Float32(cosTheta_O_s * Float32(cosTheta_i_s * Float32(cosTheta_i_m * Float32(cosTheta_O_m * Float32(Float32(0.5) / v))))) end
cosTheta_i\_m = abs(cosTheta_i);
cosTheta_i\_s = sign(cosTheta_i) * abs(1.0);
cosTheta_O\_m = abs(cosTheta_O);
cosTheta_O\_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v = num2cell(sort([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])){:}
function tmp = code(cosTheta_O_s, cosTheta_i_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
tmp = cosTheta_O_s * (cosTheta_i_s * (cosTheta_i_m * (cosTheta_O_m * (single(0.5) / v))));
end
\begin{array}{l}
cosTheta_i\_m = \left|cosTheta\_i\right|
\\
cosTheta_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
cosTheta_O\_m = \left|cosTheta\_O\right|
\\
cosTheta_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
[cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v] = \mathsf{sort}([cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v])\\
\\
cosTheta\_O\_s \cdot \left(cosTheta\_i\_s \cdot \left(cosTheta\_i\_m \cdot \left(cosTheta\_O\_m \cdot \frac{0.5}{v}\right)\right)\right)
\end{array}
Initial program 98.6%
Taylor expanded in v around inf
associate-*r/N/A
/-lowering-/.f32N/A
*-commutativeN/A
*-lowering-*.f32N/A
*-lowering-*.f3258.8
Simplified58.8%
associate-/l*N/A
*-commutativeN/A
*-commutativeN/A
*-commutativeN/A
associate-*r*N/A
*-lowering-*.f32N/A
*-lowering-*.f32N/A
/-lowering-/.f3258.8
Applied egg-rr58.8%
Final simplification58.8%
herbie shell --seed 2024203
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, upper"
:precision binary32
:pre (and (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (< 0.1 v)) (<= v 1.5707964))
(/ (* (exp (- (/ (* sinTheta_i sinTheta_O) v))) (/ (* cosTheta_i cosTheta_O) v)) (* (* (sinh (/ 1.0 v)) 2.0) v)))