47 const dim3 nthrds(1024, 1, 1);
48 const dim3 nblcks(((*m)+1024 - 1)/ 1024, 1, 1);
61 void *z,
real *g,
int *m) {
64 const dim3 nblcks(((*m)+1024 - 1)/ 1024, 1, 1);
__global__ void const T *__restrict__ x
__global__ void dirichlet_apply_scalar_kernel(const int *__restrict__ msk, T *__restrict__ x, const T g, const int m)
void cuda_dirichlet_apply_vector(void *msk, void *x, void *y, void *z, real *g, int *m)
void cuda_dirichlet_apply_scalar(void *msk, void *x, real *g, int *m)