__global__ void vreman_nut_compute(T *__restrict__ a11, T *__restrict__ a12, T *__restrict__ a13, T *__restrict__ a21, T *__restrict__ a22, T *__restrict__ a23, T *__restrict__ a31, T *__restrict__ a32, T *__restrict__ a33, T *__restrict__ delta, T *__restrict__ nut, T *__restrict__ mult, const T c, const T eps, const int n)