
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 8 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (log (/ 0.5 v)))
(t_1
(+
0.6931
(/
(- (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) 1.0)
v))))
(/
(exp (/ (pow t_1 2.0) (- t_1 t_0)))
(exp
(/
(pow (log (* 2.0 v)) 2.0)
(- (+ 0.6931 (/ (- (* (- sinTheta_O) sinTheta_i) 1.0) v)) t_0))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = logf((0.5f / v));
float t_1 = 0.6931f + ((((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) - 1.0f) / v);
return expf((powf(t_1, 2.0f) / (t_1 - t_0))) / expf((powf(logf((2.0f * v)), 2.0f) / ((0.6931f + (((-sinTheta_O * sinTheta_i) - 1.0f) / v)) - t_0)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
real(4) :: t_1
t_0 = log((0.5e0 / v))
t_1 = 0.6931e0 + ((((costheta_o * costheta_i) - (sintheta_o * sintheta_i)) - 1.0e0) / v)
code = exp(((t_1 ** 2.0e0) / (t_1 - t_0))) / exp(((log((2.0e0 * v)) ** 2.0e0) / ((0.6931e0 + (((-sintheta_o * sintheta_i) - 1.0e0) / v)) - t_0)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = log(Float32(Float32(0.5) / v)) t_1 = Float32(Float32(0.6931) + Float32(Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) - Float32(1.0)) / v)) return Float32(exp(Float32((t_1 ^ Float32(2.0)) / Float32(t_1 - t_0))) / exp(Float32((log(Float32(Float32(2.0) * v)) ^ Float32(2.0)) / Float32(Float32(Float32(0.6931) + Float32(Float32(Float32(Float32(-sinTheta_O) * sinTheta_i) - Float32(1.0)) / v)) - t_0)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = log((single(0.5) / v)); t_1 = single(0.6931) + ((((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) - single(1.0)) / v); tmp = exp(((t_1 ^ single(2.0)) / (t_1 - t_0))) / exp(((log((single(2.0) * v)) ^ single(2.0)) / ((single(0.6931) + (((-sinTheta_O * sinTheta_i) - single(1.0)) / v)) - t_0))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \log \left(\frac{0.5}{v}\right)\\
t_1 := 0.6931 + \frac{\left(cosTheta\_O \cdot cosTheta\_i - sinTheta\_O \cdot sinTheta\_i\right) - 1}{v}\\
\frac{e^{\frac{{t\_1}^{2}}{t\_1 - t\_0}}}{e^{\frac{{\log \left(2 \cdot v\right)}^{2}}{\left(0.6931 + \frac{\left(-sinTheta\_O\right) \cdot sinTheta\_i - 1}{v}\right) - t\_0}}}
\end{array}
\end{array}
Initial program 99.7%
Applied rewrites99.8%
Taylor expanded in cosTheta_i around 0
associate-*r*N/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f3299.8
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (+ 0.6931 (/ (- (* (- sinTheta_O) sinTheta_i) 1.0) v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f + (((-sinTheta_O * sinTheta_i) - 1.0f) / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp((0.6931e0 + (((-sintheta_o * sintheta_i) - 1.0e0) / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) + Float32(Float32(Float32(Float32(-sinTheta_O) * sinTheta_i) - Float32(1.0)) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(0.6931) + (((-sinTheta_O * sinTheta_i) - single(1.0)) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 + \frac{\left(-sinTheta\_O\right) \cdot sinTheta\_i - 1}{v}}
\end{array}
Initial program 99.7%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
exp-sumN/A
lift-log.f32N/A
rem-exp-logN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
metadata-evalN/A
lower-exp.f3299.8
lift-+.f32N/A
Applied rewrites99.8%
Taylor expanded in cosTheta_i around 0
associate-*r*N/A
lower-*.f32N/A
mul-1-negN/A
lower-neg.f3299.8
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (+ 0.6931 (/ (fma cosTheta_O cosTheta_i -1.0) v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f + (fmaf(cosTheta_O, cosTheta_i, -1.0f) / v)));
}
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) + Float32(fma(cosTheta_O, cosTheta_i, Float32(-1.0)) / v)))) end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 + \frac{\mathsf{fma}\left(cosTheta\_O, cosTheta\_i, -1\right)}{v}}
\end{array}
Initial program 99.7%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
exp-sumN/A
lift-log.f32N/A
rem-exp-logN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
metadata-evalN/A
lower-exp.f3299.8
lift-+.f32N/A
Applied rewrites99.8%
Taylor expanded in sinTheta_i around 0
sub-negN/A
metadata-evalN/A
lower-fma.f3298.3
Applied rewrites98.3%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (/ (* cosTheta_O cosTheta_i) v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf(((cosTheta_O * cosTheta_i) / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp(((costheta_o * costheta_i) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(cosTheta_O * cosTheta_i) / v))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp(((cosTheta_O * cosTheta_i) / v)); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{\frac{cosTheta\_O \cdot cosTheta\_i}{v}}
\end{array}
Initial program 99.7%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
exp-sumN/A
lift-log.f32N/A
rem-exp-logN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
metadata-evalN/A
lower-exp.f3299.8
lift-+.f32N/A
Applied rewrites99.8%
Taylor expanded in v around inf
Applied rewrites4.5%
Taylor expanded in cosTheta_i around inf
lower-/.f32N/A
lower-*.f3213.2
Applied rewrites13.2%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ 1.0 (/ v (* (exp 0.6931) 0.5))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 1.0f / (v / (expf(0.6931f) * 0.5f));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = 1.0e0 / (v / (exp(0.6931e0) * 0.5e0))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(1.0) / Float32(v / Float32(exp(Float32(0.6931)) * Float32(0.5)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(1.0) / (v / (exp(single(0.6931)) * single(0.5))); end
\begin{array}{l}
\\
\frac{1}{\frac{v}{e^{0.6931} \cdot 0.5}}
\end{array}
Initial program 99.7%
Taylor expanded in v around -inf
associate-+r+N/A
exp-sumN/A
metadata-evalN/A
distribute-neg-fracN/A
rem-exp-logN/A
lower-*.f32N/A
exp-sumN/A
rem-exp-logN/A
lower-*.f32N/A
lower-exp.f32N/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f324.5
Applied rewrites4.5%
Applied rewrites4.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp 0.6931)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf(0.6931f);
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp(0.6931e0)
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(0.6931))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp(single(0.6931)); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931}
\end{array}
Initial program 99.7%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
exp-sumN/A
lift-log.f32N/A
rem-exp-logN/A
lower-*.f32N/A
lift-/.f32N/A
lift-*.f32N/A
associate-/r*N/A
lower-/.f32N/A
metadata-evalN/A
lower-exp.f3299.8
lift-+.f32N/A
Applied rewrites99.8%
Taylor expanded in v around inf
Applied rewrites4.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ 0.5 (* v (exp -0.6931))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return 0.5f / (v * expf(-0.6931f));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = 0.5e0 / (v * exp((-0.6931e0)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(0.5) / Float32(v * exp(Float32(-0.6931)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = single(0.5) / (v * exp(single(-0.6931))); end
\begin{array}{l}
\\
\frac{0.5}{v \cdot e^{-0.6931}}
\end{array}
Initial program 99.7%
lift-exp.f32N/A
lift-+.f32N/A
+-commutativeN/A
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
associate-+r-N/A
exp-diffN/A
lower-/.f32N/A
Applied rewrites88.4%
lift-exp.f32N/A
lift-+.f32N/A
lift-log.f32N/A
lift-/.f32N/A
log-divN/A
associate-+l-N/A
exp-diffN/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
lower--.f32N/A
lower-log.f3288.4
lift-*.f32N/A
*-commutativeN/A
lower-*.f3288.4
lift-*.f32N/A
*-commutativeN/A
lower-*.f3288.4
Applied rewrites88.4%
Taylor expanded in v around inf
lower-/.f32N/A
lower-*.f32N/A
lower-exp.f324.5
Applied rewrites4.5%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (/ (* (exp 0.6931) 0.5) v))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (expf(0.6931f) * 0.5f) / v;
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (exp(0.6931e0) * 0.5e0) / v
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(exp(Float32(0.6931)) * Float32(0.5)) / v) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (exp(single(0.6931)) * single(0.5)) / v; end
\begin{array}{l}
\\
\frac{e^{0.6931} \cdot 0.5}{v}
\end{array}
Initial program 99.7%
Taylor expanded in v around -inf
associate-+r+N/A
exp-sumN/A
metadata-evalN/A
distribute-neg-fracN/A
rem-exp-logN/A
lower-*.f32N/A
exp-sumN/A
rem-exp-logN/A
lower-*.f32N/A
lower-exp.f32N/A
distribute-neg-fracN/A
metadata-evalN/A
lower-/.f324.5
Applied rewrites4.5%
Applied rewrites4.5%
herbie shell --seed 2024309
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))