1#ifndef __MATH_MATHOPS_KERNEL_H__ 
    2#define __MATH_MATHOPS_KERNEL_H__ 
   51    for (
int i = idx; 
i < n; 
i += 
str) {
 
   58    for (
int i = idx; 
i < n; 
i += 
str) {
 
 
   81    for (
int i = idx; 
i < n; 
i += 
str) {
 
   88    for (
int i = idx; 
i < n; 
i += 
str) {
 
 
  115    for (
int i = idx; 
i < n; 
i += 
str) {
 
  122    for (
int i = idx; 
i < n; 
i += 
str) {
 
 
  148    for (
int i = idx; 
i < n; 
i += 
str) {
 
  155    for (
int i = idx; 
i < n; 
i += 
str) {
 
 
  182    for (
int i = idx; 
i < n; 
i += 
str) {
 
  189    for (
int i = idx; 
i < n; 
i += 
str) {
 
 
__global__ void dirichlet_apply_scalar_kernel(const int *__restrict__ msk, T *__restrict__ x, const T g, const int m)
 
__global__ void opcolv_kernel(T *__restrict__ a1, T *__restrict__ a2, T *__restrict__ a3, const T *__restrict__ c, const int gdim, const int n)
 
__global__ void opchsign_kernel(T *__restrict__ a1, T *__restrict__ a2, T *__restrict__ a3, const int gdim, const int n)
 
__global__ void opadd2col_kernel(T *__restrict__ a1, T *__restrict__ a2, T *__restrict__ a3, const T *__restrict__ b1, const T *__restrict__ b2, const T *__restrict__ b3, const T *__restrict__ c, const int gdim, const int n)
 
__global__ void opcolv3c_kernel(T *__restrict__ a1, T *__restrict__ a2, T *__restrict__ a3, const T *__restrict__ b1, const T *__restrict__ b2, const T *__restrict__ b3, const T *__restrict__ c, const T d, const int gdim, const int n)
 
__global__ void opadd2cm_kernel(T *__restrict__ a1, T *__restrict__ a2, T *__restrict__ a3, const T *__restrict__ b1, const T *__restrict__ b2, const T *__restrict__ b3, const T c, const int gdim, const int n)