
; Baseline binary32 expression:
;   numerator   = exp(-(sinTheta_i * sinTheta_O) / v) * ((cosTheta_i * cosTheta_O) / v)
;   denominator = (sinh(1 / v) * 2) * v
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (/
    (*
      (exp (- (/ (* sinTheta_i sinTheta_O) v)))
      (/ (* cosTheta_i cosTheta_O) v))
    (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
!> Single-precision evaluation of
!>   exp(-(sintheta_i * sintheta_o) / v) * ((costheta_i * costheta_o) / v)
!> divided by (sinh(1 / v) * 2) * v.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o
    real(4), intent(in) :: sintheta_i, sintheta_o
    real(4), intent(in) :: v
    real(4) :: sin_ratio, cos_ratio, denom

    ! Same grouping and operation order as the single-expression form.
    sin_ratio = (sintheta_i * sintheta_o) / v
    cos_ratio = (costheta_i * costheta_o) / v
    denom = (sinh(1.0e0 / v) * 2.0e0) * v
    res = (exp(-sin_ratio) * cos_ratio) / denom
end function code
# Single-precision evaluation of
#   exp(-(sinTheta_i * sinTheta_O) / v) * ((cosTheta_i * cosTheta_O) / v)
# divided by (sinh(1 / v) * 2) * v. Each arithmetic result is rounded to
# Float32 exactly where the one-line form rounds it.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    sin_ratio = Float32(Float32(sinTheta_i * sinTheta_O) / v)
    cos_ratio = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    numerator = Float32(exp(Float32(-sin_ratio)) * cos_ratio)
    denominator = Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)
    return Float32(numerator / denominator)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Evaluates exp(-(sinTheta_i*sinTheta_O)/v) * ((cosTheta_i*cosTheta_O)/v)
    % divided by (sinh(1/v) * 2) * v, with single-precision constants.
    sin_ratio = (sinTheta_i * sinTheta_O) / v;
    cos_ratio = (cosTheta_i * cosTheta_O) / v;
    denominator = (sinh(single(1.0) / v) * single(2.0)) * v;
    tmp = (exp(-sin_ratio) * cos_ratio) / denominator;
end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 19 alternatives:
| Alternative | Accuracy | Speedup |
|---|---|---|
; Unmodified input program (binary32):
;   (exp(-(sinTheta_i * sinTheta_O) / v) * ((cosTheta_i * cosTheta_O) / v))
;   / ((sinh(1 / v) * 2) * v)
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :precision binary32
  (/
    (*
      (exp (- (/ (* sinTheta_i sinTheta_O) v)))
      (/ (* cosTheta_i cosTheta_O) v))
    (* (* (sinh (/ 1.0 v)) 2.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v)) / ((sinhf((1.0f / v)) * 2.0f) * v);
}
!> Computes (exp(-(sintheta_i * sintheta_o) / v) * ((costheta_i * costheta_o) / v))
!> over ((sinh(1 / v) * 2) * v) in single precision.
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i, costheta_o
    real(4), intent(in) :: sintheta_i, sintheta_o
    real(4), intent(in) :: v
    real(4) :: top, bottom

    ! Numerator and denominator keep the original parenthesisation.
    top = exp(-((sintheta_i * sintheta_o) / v)) * ((costheta_i * costheta_o) / v)
    bottom = (sinh(1.0e0 / v) * 2.0e0) * v
    res = top / bottom
end function code
# Computes (exp(-(sinTheta_i * sinTheta_O) / v) * ((cosTheta_i * cosTheta_O) / v))
# over ((sinh(1 / v) * 2) * v), rounding to Float32 after each arithmetic step
# in the same places as the one-line form.
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    exponent = Float32(-Float32(Float32(sinTheta_i * sinTheta_O) / v))
    scaled_cos = Float32(Float32(cosTheta_i * cosTheta_O) / v)
    top = Float32(exp(exponent) * scaled_cos)
    bottom = Float32(Float32(sinh(Float32(Float32(1.0) / v)) * Float32(2.0)) * v)
    return Float32(top / bottom)
end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v)
    % Computes (exp(-(sinTheta_i*sinTheta_O)/v) * ((cosTheta_i*cosTheta_O)/v))
    % over ((sinh(1/v) * 2) * v); the literals are single precision.
    top = exp(-((sinTheta_i * sinTheta_O) / v)) * ((cosTheta_i * cosTheta_O) / v);
    bottom = (sinh(single(1.0) / v) * single(2.0)) * v;
    tmp = top / bottom;
end
\begin{array}{l}
\\
\frac{e^{-\frac{sinTheta\_i \cdot sinTheta\_O}{v}} \cdot \frac{cosTheta\_i \cdot cosTheta\_O}{v}}{\left(\sinh \left(\frac{1}{v}\right) \cdot 2\right) \cdot v}
\end{array}
cosTheta_O_m = (fabs.f32 cosTheta_O)
cosTheta_O_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
cosTheta_i_m = (fabs.f32 cosTheta_i)
cosTheta_i_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
NOTE: The expression is symmetric only within the pairs (cosTheta_i_m, cosTheta_O_m) and (sinTheta_i, sinTheta_O); sort each pair in increasing order before calling this function. Do not sort across pairs or together with v, because the expression is not symmetric under those swaps.
; Sign/magnitude form: the signs of the two cosines (cosTheta_i_s, cosTheta_O_s)
; multiply a quotient built from their magnitudes (cosTheta_i_m, cosTheta_O_m).
; The denominator is written as 1 / ((2 / v) / (2 * (2 * sinh(1 / v)))).
(FPCore (cosTheta_i_s cosTheta_O_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
  :precision binary32
  (*
    cosTheta_i_s
    (*
      cosTheta_O_s
      (/
        (*
          cosTheta_O_m
          (* cosTheta_i_m (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v)))
        (/ 1.0 (/ (/ 2.0 v) (* 2.0 (* 2.0 (sinh (/ 1.0 v))))))))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
cosTheta_i_m = fabs(cosTheta_i);
cosTheta_i_s = copysign(1.0, cosTheta_i);
assert(cosTheta_i_m <= cosTheta_O_m && sinTheta_i <= sinTheta_O);
float code(float cosTheta_i_s, float cosTheta_O_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_i_s * (cosTheta_O_s * ((cosTheta_O_m * (cosTheta_i_m * (expf(((sinTheta_i * sinTheta_O) / -v)) / v))) / (1.0f / ((2.0f / v) / (2.0f * (2.0f * sinhf((1.0f / v))))))));
}
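cosTheta_O_m = abs(costheta_o)
cosTheta_O_s = sign(1.0e0, costheta_o)
cosTheta_i_m = abs(costheta_i)
cosTheta_i_s = sign(1.0e0, costheta_i)
NOTE: The expression is symmetric only within the pairs (cosTheta_i_m, cosTheta_O_m) and (sinTheta_i, sinTheta_O); sort each pair in increasing order before calling this function. Do not sort across pairs or together with v, because the expression is not symmetric under those swaps.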
!> Sign/magnitude form. Returns
!>   costheta_i_s * (costheta_o_s * (numer / denom))
!> with
!>   numer = costheta_o_m * (costheta_i_m * (exp((sintheta_i * sintheta_o) / (-v)) / v))
!>   denom = 1 / ((2 / v) / (2 * (2 * sinh(1 / v))))
!>
!> The computation is split into short statements so that no source line
!> exceeds the 132-column free-form limit, and the negated divisor is
!> parenthesised because standard Fortran does not permit a unary minus
!> directly after a binary operator.
real(4) function code(costheta_i_s, costheta_o_s, costheta_i_m, costheta_o_m, &
                      sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i_s, costheta_o_s
    real(4), intent(in) :: costheta_i_m, costheta_o_m
    real(4), intent(in) :: sintheta_i, sintheta_o
    real(4), intent(in) :: v
    real(4) :: decay, numer, denom

    ! Grouping and operation order match the original single expression.
    decay = exp((sintheta_i * sintheta_o) / (-v)) / v
    numer = costheta_o_m * (costheta_i_m * decay)
    denom = 1.0e0 / ((2.0e0 / v) / (2.0e0 * (2.0e0 * sinh(1.0e0 / v))))
    res = costheta_i_s * (costheta_o_s * (numer / denom))
end function code
# Caller-side preprocessing: split each cosine into magnitude and sign, then
# order each interchangeable pair. Only (cosTheta_i_m, cosTheta_O_m) and
# (sinTheta_i, sinTheta_O) may be swapped without changing the result; v must
# stay in its own position.
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0, cosTheta_O)
cosTheta_i_m = abs(cosTheta_i)
cosTheta_i_s = copysign(1.0, cosTheta_i)
cosTheta_i_m, cosTheta_O_m = sort([cosTheta_i_m, cosTheta_O_m])
sinTheta_i, sinTheta_O = sort([sinTheta_i, sinTheta_O])

# Sign/magnitude form. Returns
#   cosTheta_i_s * (cosTheta_O_s * (numerator / denominator))
# with
#   numerator   = cosTheta_O_m * (cosTheta_i_m * (exp((sinTheta_i * sinTheta_O) / -v) / v))
#   denominator = 1 / ((2 / v) / (2 * (2 * sinh(1 / v))))
# Each arithmetic result is rounded to Float32 where the one-line form rounds it.
function code(cosTheta_i_s, cosTheta_O_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
    decay = Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v)
    numerator = Float32(cosTheta_O_m * Float32(cosTheta_i_m * decay))
    two_sinh = Float32(Float32(2.0) * sinh(Float32(Float32(1.0) / v)))
    denominator = Float32(Float32(1.0) / Float32(Float32(Float32(2.0) / v) / Float32(Float32(2.0) * two_sinh)))
    return Float32(cosTheta_i_s * Float32(cosTheta_O_s * Float32(numerator / denominator)))
end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m = abs(cosTheta_i);
cosTheta_i_s = sign(cosTheta_i) * abs(1.0);
cos_sorted = num2cell(sort([cosTheta_i_m, cosTheta_O_m])); [cosTheta_i_m, cosTheta_O_m] = cos_sorted{:};
sin_sorted = num2cell(sort([sinTheta_i, sinTheta_O])); [sinTheta_i, sinTheta_O] = sin_sorted{:};
function tmp = code(cosTheta_i_s, cosTheta_O_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
    % Sign/magnitude form: the two sign factors multiply numerator / denominator,
    % where the denominator is 1 / ((2 / v) / (2 * (2 * sinh(1 / v)))).
    decay = exp((sinTheta_i * sinTheta_O) / -v) / v;
    numerator = cosTheta_O_m * (cosTheta_i_m * decay);
    two_sinh = single(2.0) * sinh(single(1.0) / v);
    denominator = single(1.0) / ((single(2.0) / v) / (single(2.0) * two_sinh));
    tmp = cosTheta_i_s * (cosTheta_O_s * (numerator / denominator));
end
\begin{array}{l}
cosTheta\_O\_m = \left|cosTheta\_O\right|
\\
cosTheta\_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
cosTheta\_i\_m = \left|cosTheta\_i\right|
\\
cosTheta\_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
[cosTheta\_i\_m, cosTheta\_O\_m] = \mathsf{sort}([cosTheta\_i\_m, cosTheta\_O\_m])\\
[sinTheta\_i, sinTheta\_O] = \mathsf{sort}([sinTheta\_i, sinTheta\_O])\\
\\
cosTheta\_i\_s \cdot \left(cosTheta\_O\_s \cdot \frac{cosTheta\_O\_m \cdot \left(cosTheta\_i\_m \cdot \frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v}\right)}{\frac{1}{\frac{\frac{2}{v}}{2 \cdot \left(2 \cdot \sinh \left(\frac{1}{v}\right)\right)}}}\right)
\end{array}
Initial program 98.9%
lift-*.f32: N/A
*-commutative: N/A
lift-/.f32: N/A
div-inv: N/A
lift-/.f32: N/A
associate-*l*: N/A
lift-*.f32: N/A
*-commutative: N/A
associate-*l*: N/A
lower-*.f32: N/A
lower-*.f32: N/A
*-commutative: N/A
lift-/.f32: N/A
div-inv: N/A
lower-/.f32: 99.1
lift-neg.f32: N/A
lift-/.f32: N/A
distribute-neg-frac2: N/A
lower-/.f32: N/A
lower-neg.f32: 99.1
Applied rewrites: 99.1%
lift-*.f32: N/A
remove-double-div: N/A
lift-/.f32: N/A
un-div-inv: N/A
lower-/.f32: 99.1
Applied rewrites: 99.1%
lift-/.f32: N/A
lift-*.f32: N/A
associate-/l*: N/A
lift-sinh.f32: N/A
sinh-def: N/A
sinh-undef: N/A
lift-sinh.f32: N/A
*-commutative: N/A
lift-*.f32: N/A
frac-times: N/A
clear-num: N/A
lower-/.f32: N/A
lower-/.f32: N/A
lift-/.f32: N/A
un-div-inv: N/A
lower-/.f32: N/A
lower-*.f32: 99.2
Applied rewrites: 99.2%
Final simplification: 99.2%
cosTheta_O_m = (fabs.f32 cosTheta_O)
cosTheta_O_s = (copysign.f32 #s(literal 1 binary32) cosTheta_O)
cosTheta_i_m = (fabs.f32 cosTheta_i)
cosTheta_i_s = (copysign.f32 #s(literal 1 binary32) cosTheta_i)
NOTE: The expression is symmetric only within the pairs (cosTheta_i_m, cosTheta_O_m) and (sinTheta_i, sinTheta_O); sort each pair in increasing order before calling this function. Do not sort across pairs or together with v, because the expression is not symmetric under those swaps.
; Sign/magnitude form: the signs of the two cosines (cosTheta_i_s, cosTheta_O_s)
; multiply a quotient built from their magnitudes (cosTheta_i_m, cosTheta_O_m).
; The denominator is written as sinh(1 / v) * (4 / (2 / v)).
(FPCore (cosTheta_i_s cosTheta_O_s cosTheta_i_m cosTheta_O_m sinTheta_i sinTheta_O v)
  :precision binary32
  (*
    cosTheta_i_s
    (*
      cosTheta_O_s
      (/
        (*
          cosTheta_O_m
          (* cosTheta_i_m (/ (exp (/ (* sinTheta_i sinTheta_O) (- v))) v)))
        (* (sinh (/ 1.0 v)) (/ 4.0 (/ 2.0 v)))))))
cosTheta_O_m = fabs(cosTheta_O);
cosTheta_O_s = copysign(1.0, cosTheta_O);
cosTheta_i_m = fabs(cosTheta_i);
cosTheta_i_s = copysign(1.0, cosTheta_i);
assert(cosTheta_i_m <= cosTheta_O_m && sinTheta_i <= sinTheta_O);
float code(float cosTheta_i_s, float cosTheta_O_s, float cosTheta_i_m, float cosTheta_O_m, float sinTheta_i, float sinTheta_O, float v) {
return cosTheta_i_s * (cosTheta_O_s * ((cosTheta_O_m * (cosTheta_i_m * (expf(((sinTheta_i * sinTheta_O) / -v)) / v))) / (sinhf((1.0f / v)) * (4.0f / (2.0f / v)))));
}
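cosTheta_O_m = abs(costheta_o)
cosTheta_O_s = sign(1.0e0, costheta_o)
cosTheta_i_m = abs(costheta_i)
cosTheta_i_s = sign(1.0e0, costheta_i)
NOTE: The expression is symmetric only within the pairs (cosTheta_i_m, cosTheta_O_m) and (sinTheta_i, sinTheta_O); sort each pair in increasing order before calling this function. Do not sort across pairs or together with v, because the expression is not symmetric under those swaps.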
!> Sign/magnitude form. Returns
!>   costheta_i_s * (costheta_o_s * (numer / denom))
!> with
!>   numer = costheta_o_m * (costheta_i_m * (exp((sintheta_i * sintheta_o) / (-v)) / v))
!>   denom = sinh(1 / v) * (4 / (2 / v))
!>
!> The computation is split into short statements so that no source line
!> exceeds the 132-column free-form limit, and the negated divisor is
!> parenthesised because standard Fortran does not permit a unary minus
!> directly after a binary operator.
real(4) function code(costheta_i_s, costheta_o_s, costheta_i_m, costheta_o_m, &
                      sintheta_i, sintheta_o, v) result(res)
    implicit none
    real(4), intent(in) :: costheta_i_s, costheta_o_s
    real(4), intent(in) :: costheta_i_m, costheta_o_m
    real(4), intent(in) :: sintheta_i, sintheta_o
    real(4), intent(in) :: v
    real(4) :: decay, numer, denom

    ! Grouping and operation order match the original single expression.
    decay = exp((sintheta_i * sintheta_o) / (-v)) / v
    numer = costheta_o_m * (costheta_i_m * decay)
    denom = sinh(1.0e0 / v) * (4.0e0 / (2.0e0 / v))
    res = costheta_i_s * (costheta_o_s * (numer / denom))
end function code
# Caller-side preprocessing: split each cosine into magnitude and sign, then
# order each interchangeable pair. Only (cosTheta_i_m, cosTheta_O_m) and
# (sinTheta_i, sinTheta_O) may be swapped without changing the result; v must
# stay in its own position.
cosTheta_O_m = abs(cosTheta_O)
cosTheta_O_s = copysign(1.0, cosTheta_O)
cosTheta_i_m = abs(cosTheta_i)
cosTheta_i_s = copysign(1.0, cosTheta_i)
cosTheta_i_m, cosTheta_O_m = sort([cosTheta_i_m, cosTheta_O_m])
sinTheta_i, sinTheta_O = sort([sinTheta_i, sinTheta_O])

# Sign/magnitude form. Returns
#   cosTheta_i_s * (cosTheta_O_s * (numerator / denominator))
# with
#   numerator   = cosTheta_O_m * (cosTheta_i_m * (exp((sinTheta_i * sinTheta_O) / -v) / v))
#   denominator = sinh(1 / v) * (4 / (2 / v))
# Each arithmetic result is rounded to Float32 where the one-line form rounds it.
function code(cosTheta_i_s, cosTheta_O_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
    decay = Float32(exp(Float32(Float32(sinTheta_i * sinTheta_O) / Float32(-v))) / v)
    numerator = Float32(cosTheta_O_m * Float32(cosTheta_i_m * decay))
    denominator = Float32(sinh(Float32(Float32(1.0) / v)) * Float32(Float32(4.0) / Float32(Float32(2.0) / v)))
    return Float32(cosTheta_i_s * Float32(cosTheta_O_s * Float32(numerator / denominator)))
end
cosTheta_O_m = abs(cosTheta_O);
cosTheta_O_s = sign(cosTheta_O) * abs(1.0);
cosTheta_i_m = abs(cosTheta_i);
cosTheta_i_s = sign(cosTheta_i) * abs(1.0);
cos_sorted = num2cell(sort([cosTheta_i_m, cosTheta_O_m])); [cosTheta_i_m, cosTheta_O_m] = cos_sorted{:};
sin_sorted = num2cell(sort([sinTheta_i, sinTheta_O])); [sinTheta_i, sinTheta_O] = sin_sorted{:};
function tmp = code(cosTheta_i_s, cosTheta_O_s, cosTheta_i_m, cosTheta_O_m, sinTheta_i, sinTheta_O, v)
    % Sign/magnitude form: the two sign factors multiply numerator / denominator,
    % where the denominator is sinh(1 / v) * (4 / (2 / v)).
    decay = exp((sinTheta_i * sinTheta_O) / -v) / v;
    numerator = cosTheta_O_m * (cosTheta_i_m * decay);
    denominator = sinh(single(1.0) / v) * (single(4.0) / (single(2.0) / v));
    tmp = cosTheta_i_s * (cosTheta_O_s * (numerator / denominator));
end
\begin{array}{l}
cosTheta\_O\_m = \left|cosTheta\_O\right|
\\
cosTheta\_O\_s = \mathsf{copysign}\left(1, cosTheta\_O\right)
\\
cosTheta\_i\_m = \left|cosTheta\_i\right|
\\
cosTheta\_i\_s = \mathsf{copysign}\left(1, cosTheta\_i\right)
\\
[cosTheta\_i\_m, cosTheta\_O\_m] = \mathsf{sort}([cosTheta\_i\_m, cosTheta\_O\_m])\\
[sinTheta\_i, sinTheta\_O] = \mathsf{sort}([sinTheta\_i, sinTheta\_O])\\
\\
cosTheta\_i\_s \cdot \left(cosTheta\_O\_s \cdot \frac{cosTheta\_O\_m \cdot \left(cosTheta\_i\_m \cdot \frac{e^{\frac{sinTheta\_i \cdot sinTheta\_O}{-v}}}{v}\right)}{\sinh \left(\frac{1}{v}\right) \cdot \frac{4}{\frac{2}{v}}}\right)
\end{array}
Initial program 98.5%
lift-*.f32: N/A
*-commutative: N/A
lift-/.f32: N/A
div-inv: N/A
lift-/.f32: N/A
associate-*l*: N/A
lift-*.f32: N/A
*-commutative: N/A
associate-*l*: N/A
lower-*.f32: N/A
lower-*.f32: N/A
*-commutative: N/A
lift-/.f32: N/A
div-inv: N/A
lower-/.f32: 98.7
lift-neg.f32: N/A
lift-/.f32: N/A
distribute-neg-frac2: N/A
lower-/.f32: N/A
lower-neg.f32: 98.7
Applied rewrites: 98.7%
lift-*.f32: N/A
remove-double-div: N/A
lift-/.f32: N/A
un-div-inv: N/A
lower-/.f32: 98.9
Applied rewrites: 98.9%
lift-/.f32: N/A
lift-*.f32: N/A
associate-/l*: N/A
lift-sinh.f32: N/A
sinh-def: N/A
sinh-undef: N/A
lift-sinh.f32: N/A
*-commutative: N/A
lift-*.f32: N/A
frac-times: N/A
clear-num: N/A
lower-/.f32: N/A
lower-/.f32: N/A
lift-/.f32: N/A
un-div-inv: N/A
lower-/.f32: N/A
lower-*.f32: 98.8
Applied rewrites: 98.8%
lift-/.f32: N/A
lift-/.f32: N/A
clear-num: N/A
lift-*.f32: N/A
lift-*.f32: N/A
associate-*l*: N/A
associate-/l*: N/A
lower-*.f32: N/A
lower-/.f32: N/A
metadata-eval: 98.8
Applied rewrites: 98.8%
herbie shell --seed 2024228
; Benchmark input. The precondition bounds each of the four trigonometric
; arguments to [-1, 1] and restricts v to (0.1, 1.5707964].
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
  :name "HairBSDF, Mp, upper"
  :precision binary32
  :pre (and (<= -1.0 cosTheta_i 1.0)
            (<= -1.0 cosTheta_O 1.0)
            (<= -1.0 sinTheta_i 1.0)
            (<= -1.0 sinTheta_O 1.0)
            (< 0.1 v)
            (<= v 1.5707964))
  (/
    (*
      (exp (- (/ (* sinTheta_i sinTheta_O) v)))
      (/ (* cosTheta_i cosTheta_O) v))
    (* (* (sinh (/ 1.0 v)) 2.0) v)))