
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0
(/
(fma cosTheta_i cosTheta_O (fma sinTheta_i (- sinTheta_O) -1.0))
v))
(t_1 (log (* v 2.0)))
(t_2 (+ 0.6931 (/ (fma cosTheta_O cosTheta_i -1.0) v))))
(*
(pow (* v 2.0) (/ t_1 (- (- (- 0.6931) t_1) t_0)))
(exp (/ (* t_2 t_2) (+ t_0 (+ t_1 0.6931)))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = fmaf(cosTheta_i, cosTheta_O, fmaf(sinTheta_i, -sinTheta_O, -1.0f)) / v;
float t_1 = logf((v * 2.0f));
float t_2 = 0.6931f + (fmaf(cosTheta_O, cosTheta_i, -1.0f) / v);
return powf((v * 2.0f), (t_1 / ((-0.6931f - t_1) - t_0))) * expf(((t_2 * t_2) / (t_0 + (t_1 + 0.6931f))));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(fma(cosTheta_i, cosTheta_O, fma(sinTheta_i, Float32(-sinTheta_O), Float32(-1.0))) / v) t_1 = log(Float32(v * Float32(2.0))) t_2 = Float32(Float32(0.6931) + Float32(fma(cosTheta_O, cosTheta_i, Float32(-1.0)) / v)) return Float32((Float32(v * Float32(2.0)) ^ Float32(t_1 / Float32(Float32(Float32(-Float32(0.6931)) - t_1) - t_0))) * exp(Float32(Float32(t_2 * t_2) / Float32(t_0 + Float32(t_1 + Float32(0.6931)))))) end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{\mathsf{fma}\left(cosTheta\_i, cosTheta\_O, \mathsf{fma}\left(sinTheta\_i, -sinTheta\_O, -1\right)\right)}{v}\\
t_1 := \log \left(v \cdot 2\right)\\
t_2 := 0.6931 + \frac{\mathsf{fma}\left(cosTheta\_O, cosTheta\_i, -1\right)}{v}\\
{\left(v \cdot 2\right)}^{\left(\frac{t\_1}{\left(\left(-0.6931\right) - t\_1\right) - t\_0}\right)} \cdot e^{\frac{t\_2 \cdot t\_2}{t\_0 + \left(t\_1 + 0.6931\right)}}
\end{array}
\end{array}
Initial program 99.7%
Applied rewrites99.8%
lift-/.f32N/A
clear-numN/A
associate-/r/N/A
lower-*.f32N/A
Applied rewrites99.8%
Applied rewrites99.8%
Taylor expanded in sinTheta_i around 0
unpow2N/A
lower-*.f32N/A
associate--l+N/A
lower-+.f32N/A
div-subN/A
lower-/.f32N/A
sub-negN/A
metadata-evalN/A
lower-fma.f32N/A
associate--l+N/A
lower-+.f32N/A
div-subN/A
lower-/.f32N/A
sub-negN/A
metadata-evalN/A
lower-fma.f3299.8
Applied rewrites99.8%
Final simplification99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (fma (fma (* cosTheta_i cosTheta_O) v (- v)) (/ 1.0 (* v v)) (- 0.6931 (log (* v 2.0))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(fmaf(fmaf((cosTheta_i * cosTheta_O), v, -v), (1.0f / (v * v)), (0.6931f - logf((v * 2.0f)))));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(fma(fma(Float32(cosTheta_i * cosTheta_O), v, Float32(-v)), Float32(Float32(1.0) / Float32(v * v)), Float32(Float32(0.6931) - log(Float32(v * Float32(2.0)))))) end
\begin{array}{l}
\\
e^{\mathsf{fma}\left(\mathsf{fma}\left(cosTheta\_i \cdot cosTheta\_O, v, -v\right), \frac{1}{v \cdot v}, 0.6931 - \log \left(v \cdot 2\right)\right)}
\end{array}
Initial program 99.7%
lift-+.f32N/A
lift-+.f32N/A
associate-+l+N/A
lift--.f32N/A
lift--.f32N/A
lift-/.f32N/A
lift-/.f32N/A
sub-divN/A
lift-/.f32N/A
frac-subN/A
div-invN/A
metadata-evalN/A
frac-timesN/A
lift-/.f32N/A
lift-/.f32N/A
Applied rewrites99.7%
Taylor expanded in cosTheta_i around inf
lower-*.f3299.7
Applied rewrites99.7%
Final simplification99.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (- (+ 0.6931 (/ (fma v (* cosTheta_i cosTheta_O) (- v)) (* v v))) (log (* v 2.0)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((0.6931f + (fmaf(v, (cosTheta_i * cosTheta_O), -v) / (v * v))) - logf((v * 2.0f))));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(0.6931) + Float32(fma(v, Float32(cosTheta_i * cosTheta_O), Float32(-v)) / Float32(v * v))) - log(Float32(v * Float32(2.0))))) end
\begin{array}{l}
\\
e^{\left(0.6931 + \frac{\mathsf{fma}\left(v, cosTheta\_i \cdot cosTheta\_O, -v\right)}{v \cdot v}\right) - \log \left(v \cdot 2\right)}
\end{array}
Initial program 99.7%
lift-+.f32N/A
lift-+.f32N/A
associate-+l+N/A
lift--.f32N/A
lift--.f32N/A
lift-/.f32N/A
lift-/.f32N/A
sub-divN/A
lift-/.f32N/A
frac-subN/A
div-invN/A
metadata-evalN/A
frac-timesN/A
lift-/.f32N/A
lift-/.f32N/A
Applied rewrites99.7%
Taylor expanded in cosTheta_i around inf
lower-*.f3299.7
Applied rewrites99.7%
lift-fma.f32N/A
lift--.f32N/A
associate-+r-N/A
lower--.f32N/A
Applied rewrites99.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (+ 0.6931 (/ -1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f + (-1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp((0.6931e0 + ((-1.0e0) / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) + Float32(Float32(-1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(0.6931) + (single(-1.0) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 + \frac{-1}{v}}
\end{array}
Initial program 99.7%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
lower-*.f32N/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
sub-negN/A
lower-+.f32N/A
distribute-neg-inN/A
mul-1-negN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
distribute-rgt1-inN/A
+-commutativeN/A
lower-*.f32N/A
Applied rewrites99.7%
Taylor expanded in sinTheta_O around 0
Applied rewrites99.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ (fma cosTheta_O cosTheta_i -1.0) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((fmaf(cosTheta_O, cosTheta_i, -1.0f) / v));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(fma(cosTheta_O, cosTheta_i, Float32(-1.0)) / v)) end
\begin{array}{l}
\\
e^{\frac{\mathsf{fma}\left(cosTheta\_O, cosTheta\_i, -1\right)}{v}}
\end{array}
Initial program 99.7%
Taylor expanded in v around 0
lower-/.f32N/A
sub-negN/A
lower-fma.f32N/A
+-commutativeN/A
distribute-neg-inN/A
distribute-rgt-neg-inN/A
mul-1-negN/A
metadata-evalN/A
lower-fma.f32N/A
mul-1-negN/A
lower-neg.f3297.4
Applied rewrites97.4%
Taylor expanded in sinTheta_O around 0
Applied rewrites97.4%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ (* cosTheta_i cosTheta_O) v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((cosTheta_i * cosTheta_O) / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((costheta_i * costheta_o) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(cosTheta_i * cosTheta_O) / v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((cosTheta_i * cosTheta_O) / v)); end
\begin{array}{l}
\\
e^{\frac{cosTheta\_i \cdot cosTheta\_O}{v}}
\end{array}
Initial program 99.7%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3211.7
Applied rewrites11.7%
Applied rewrites11.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (* cosTheta_i (/ cosTheta_O v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((cosTheta_i * (cosTheta_O / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp((costheta_i * (costheta_o / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(cosTheta_i * Float32(cosTheta_O / v))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((cosTheta_i * (cosTheta_O / v))); end
\begin{array}{l}
\\
e^{cosTheta\_i \cdot \frac{cosTheta\_O}{v}}
\end{array}
Initial program 99.7%
Taylor expanded in cosTheta_i around inf
*-commutativeN/A
associate-*r/N/A
lower-*.f32N/A
lower-/.f3211.7
Applied rewrites11.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp 0.6931)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf(0.6931f);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp(0.6931e0)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(0.6931))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp(single(0.6931)); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931}
\end{array}
Initial program 99.7%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
lower-*.f32N/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
sub-negN/A
lower-+.f32N/A
distribute-neg-inN/A
mul-1-negN/A
associate-*r/N/A
*-commutativeN/A
associate-/l*N/A
metadata-evalN/A
distribute-neg-fracN/A
distribute-rgt1-inN/A
+-commutativeN/A
lower-*.f32N/A
Applied rewrites99.7%
Taylor expanded in v around inf
Applied rewrites4.7%
herbie shell --seed 2024237
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))