47    const dim3 nthrds(1024, 1, 1);
 
   48    const dim3 nblcks(((*m)+1024 - 1)/ 1024, 1, 1);
 
 
   61                                  void *z, 
real *g, 
int *m) {
 
   64    const dim3 nblcks(((*m)+1024 - 1)/ 1024, 1, 1);
 
 
__global__ void const T *__restrict__ x
 
__global__ void dirichlet_apply_scalar_kernel(const int *__restrict__ msk, T *__restrict__ x, const T g, const int m)
 
void cuda_dirichlet_apply_vector(void *msk, void *x, void *y, void *z, real *g, int *m)
 
void cuda_dirichlet_apply_scalar(void *msk, void *x, real *g, int *m)