__global__ void smagorinsky_nut_compute(T *__restrict__ s11, T *__restrict__ s22, T *__restrict__ s33, T *__restrict__ s12, T *__restrict__ s13, T *__restrict__ s23, T *__restrict__ delta, T *__restrict__ nut, T *__restrict__ mult, const T c_s, const int n)