
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
Sampling outcomes in binary32 precision:
Herbie found 6 alternatives:
| Alternative | Accuracy | Speedup |
|---|
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(exp
(+
(+
(-
(- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v))
(/ 1.0 v))
0.6931)
(log (/ 1.0 (* 2.0 v))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (1.0f / v)) + 0.6931f) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((((costheta_i * costheta_o) / v) - ((sintheta_i * sintheta_o) / v)) - (1.0e0 / v)) + 0.6931e0) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_i * cosTheta_O) / v) - Float32(Float32(sinTheta_i * sinTheta_O) / v)) - Float32(Float32(1.0) / v)) + Float32(0.6931)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((((cosTheta_i * cosTheta_O) / v) - ((sinTheta_i * sinTheta_O) / v)) - (single(1.0) / v)) + single(0.6931)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
e^{\left(\left(\left(\frac{cosTheta\_i \cdot cosTheta\_O}{v} - \frac{sinTheta\_i \cdot sinTheta\_O}{v}\right) - \frac{1}{v}\right) + 0.6931\right) + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:precision binary32
(let* ((t_0 (+ (/ 1.0 v) 0.6931)))
(exp
(+
(/
(-
(* (- (* cosTheta_O cosTheta_i) (* sinTheta_O sinTheta_i)) t_0)
(* v (- (pow v -2.0) 0.48038761)))
(* v t_0))
(log (/ 1.0 (* 2.0 v)))))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
float t_0 = (1.0f / v) + 0.6931f;
return expf(((((((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) * t_0) - (v * (powf(v, -2.0f) - 0.48038761f))) / (v * t_0)) + logf((1.0f / (2.0f * v)))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
real(4) :: t_0
t_0 = (1.0e0 / v) + 0.6931e0
code = exp(((((((costheta_o * costheta_i) - (sintheta_o * sintheta_i)) * t_0) - (v * ((v ** (-2.0e0)) - 0.48038761e0))) / (v * t_0)) + log((1.0e0 / (2.0e0 * v)))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = Float32(Float32(Float32(1.0) / v) + Float32(0.6931)) return exp(Float32(Float32(Float32(Float32(Float32(Float32(cosTheta_O * cosTheta_i) - Float32(sinTheta_O * sinTheta_i)) * t_0) - Float32(v * Float32((v ^ Float32(-2.0)) - Float32(0.48038761)))) / Float32(v * t_0)) + log(Float32(Float32(1.0) / Float32(Float32(2.0) * v))))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) t_0 = (single(1.0) / v) + single(0.6931); tmp = exp(((((((cosTheta_O * cosTheta_i) - (sinTheta_O * sinTheta_i)) * t_0) - (v * ((v ^ single(-2.0)) - single(0.48038761)))) / (v * t_0)) + log((single(1.0) / (single(2.0) * v))))); end
\begin{array}{l}
\\
\begin{array}{l}
t_0 := \frac{1}{v} + 0.6931\\
e^{\frac{\left(cosTheta\_O \cdot cosTheta\_i - sinTheta\_O \cdot sinTheta\_i\right) \cdot t\_0 - v \cdot \left({v}^{-2} - 0.48038761\right)}{v \cdot t\_0} + \log \left(\frac{1}{2 \cdot v}\right)}
\end{array}
\end{array}
Initial program 99.8%
lift-+.f32N/A
lift--.f32N/A
associate-+l-N/A
lift--.f32N/A
lift-/.f32N/A
lift-/.f32N/A
sub-divN/A
flip--N/A
frac-subN/A
lower-/.f32N/A
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (* (/ (- (- 0.6931 (/ 1.0 v)) (log (* 2.0 v))) sinTheta_O) sinTheta_O)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf(((((0.6931f - (1.0f / v)) - logf((2.0f * v))) / sinTheta_O) * sinTheta_O));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((((0.6931e0 - (1.0e0 / v)) - log((2.0e0 * v))) / sintheta_o) * sintheta_o))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(Float32(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)) - log(Float32(Float32(2.0) * v))) / sinTheta_O) * sinTheta_O)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp(((((single(0.6931) - (single(1.0) / v)) - log((single(2.0) * v))) / sinTheta_O) * sinTheta_O)); end
\begin{array}{l}
\\
e^{\frac{\left(0.6931 - \frac{1}{v}\right) - \log \left(2 \cdot v\right)}{sinTheta\_O} \cdot sinTheta\_O}
\end{array}
Initial program 99.8%
Taylor expanded in cosTheta_i around 0
lower--.f32N/A
+-commutativeN/A
lower-+.f32N/A
rem-exp-logN/A
lower-log.f32N/A
rem-exp-logN/A
lower-/.f32N/A
div-add-revN/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f3237.8
Applied rewrites38.2%
Taylor expanded in sinTheta_O around inf
Applied rewrites96.7%
Applied rewrites96.7%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (- 0.6931 (+ (log (* 2.0 v)) (/ 1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((0.6931f - (logf((2.0f * v)) + (1.0f / v))));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp((0.6931e0 - (log((2.0e0 * v)) + (1.0e0 / v))))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(0.6931) - Float32(log(Float32(Float32(2.0) * v)) + Float32(Float32(1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(0.6931) - (log((single(2.0) * v)) + (single(1.0) / v)))); end
\begin{array}{l}
\\
e^{0.6931 - \left(\log \left(2 \cdot v\right) + \frac{1}{v}\right)}
\end{array}
Initial program 99.8%
Taylor expanded in cosTheta_i around 0
lower--.f32N/A
+-commutativeN/A
lower-+.f32N/A
rem-exp-logN/A
lower-log.f32N/A
rem-exp-logN/A
lower-/.f32N/A
div-add-revN/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f3238.2
Applied rewrites38.2%
Applied rewrites38.5%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (* (/ 0.5 v) (exp (- 0.6931 (/ 1.0 v)))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return (0.5f / v) * expf((0.6931f - (1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = (0.5e0 / v) * exp((0.6931e0 - (1.0e0 / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return Float32(Float32(Float32(0.5) / v) * exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v)))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = (single(0.5) / v) * exp((single(0.6931) - (single(1.0) / v))); end
\begin{array}{l}
\\
\frac{0.5}{v} \cdot e^{0.6931 - \frac{1}{v}}
\end{array}
Initial program 99.8%
Taylor expanded in cosTheta_i around 0
+-commutativeN/A
associate--l+N/A
exp-sumN/A
lower-*.f32N/A
rem-exp-logN/A
lower-/.f32N/A
lower-exp.f32N/A
lower--.f32N/A
div-add-revN/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f3299.8
Applied rewrites99.8%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.8%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (- 0.6931 (/ 1.0 v))))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((0.6931f - (1.0f / v)));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp((0.6931e0 - (1.0e0 / v)))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(0.6931) - Float32(Float32(1.0) / v))) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(0.6931) - (single(1.0) / v))); end
\begin{array}{l}
\\
e^{0.6931 - \frac{1}{v}}
\end{array}
Initial program 99.8%
Taylor expanded in cosTheta_i around 0
lower--.f32N/A
+-commutativeN/A
lower-+.f32N/A
rem-exp-logN/A
lower-log.f32N/A
rem-exp-logN/A
lower-/.f32N/A
div-add-revN/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f3238.2
Applied rewrites38.6%
Applied rewrites38.8%
Taylor expanded in sinTheta_i around 0
Applied rewrites99.8%
Taylor expanded in v around 0
Applied rewrites98.7%
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v) :precision binary32 (exp (/ -1.0 v)))
float code(float cosTheta_i, float cosTheta_O, float sinTheta_i, float sinTheta_O, float v) {
return expf((-1.0f / v));
}
real(4) function code(costheta_i, costheta_o, sintheta_i, sintheta_o, v)
real(4), intent (in) :: costheta_i
real(4), intent (in) :: costheta_o
real(4), intent (in) :: sintheta_i
real(4), intent (in) :: sintheta_o
real(4), intent (in) :: v
code = exp(((-1.0e0) / v))
end function
function code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) return exp(Float32(Float32(-1.0) / v)) end
function tmp = code(cosTheta_i, cosTheta_O, sinTheta_i, sinTheta_O, v) tmp = exp((single(-1.0) / v)); end
\begin{array}{l}
\\
e^{\frac{-1}{v}}
\end{array}
Initial program 99.8%
Taylor expanded in cosTheta_i around 0
lower--.f32N/A
+-commutativeN/A
lower-+.f32N/A
rem-exp-logN/A
lower-log.f32N/A
rem-exp-logN/A
lower-/.f32N/A
div-add-revN/A
lower-/.f32N/A
+-commutativeN/A
lower-fma.f3238.6
Applied rewrites38.6%
Taylor expanded in v around 0
Applied rewrites98.6%
Taylor expanded in sinTheta_i around 0
Applied rewrites98.7%
herbie shell --seed 2024320
(FPCore (cosTheta_i cosTheta_O sinTheta_i sinTheta_O v)
:name "HairBSDF, Mp, lower"
:precision binary32
:pre (and (and (and (and (and (<= -1.0 cosTheta_i) (<= cosTheta_i 1.0)) (and (<= -1.0 cosTheta_O) (<= cosTheta_O 1.0))) (and (<= -1.0 sinTheta_i) (<= sinTheta_i 1.0))) (and (<= -1.0 sinTheta_O) (<= sinTheta_O 1.0))) (and (<= -1.5707964 v) (<= v 0.1)))
(exp (+ (+ (- (- (/ (* cosTheta_i cosTheta_O) v) (/ (* sinTheta_i sinTheta_O) v)) (/ 1.0 v)) 0.6931) (log (/ 1.0 (* 2.0 v))))))