Neko 0.9.99
A portable framework for high-order spectral element flow simulations
Loading...
Searching...
No Matches
opr_dudxyz.cu File Reference
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include "dudxyz_kernel.h"
#include <device/device_config.h>
#include <device/cuda/check.h>
#include <common/neko_log.h>

Go to the source code of this file.

Macros

#define CASE_1D(LX)
 
#define CASE_KSTEP(LX)
 
#define CASE(LX)
 
#define CASE_LARGE(LX)
 

Functions

template<const int >
int tune_dudxyz (void *du, void *u, void *dr, void *ds, void *dt, void *dx, void *dy, void *dz, void *jacinv, int *nel, int *lx)
 
void cuda_dudxyz (void *du, void *u, void *dr, void *ds, void *dt, void *dx, void *dy, void *dz, void *jacinv, int *nel, int *lx)
 

Macro Definition Documentation

◆ CASE

#define CASE (   LX)
Value:
case LX: \
if(autotune[LX] == 0 ) { \
dr, ds, dt, \
dx, dy, dz, \
jacinv, nel, lx); \
} else if (autotune[LX] == 1 ) { \
} else if (autotune[LX] == 2 ) { \
} \
break
__global__ void T *__restrict__ T *__restrict__ const T *__restrict__ u
__global__ void T *__restrict__ T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dx
__global__ void T *__restrict__ T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dz
__global__ void T *__restrict__ T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dy
__global__ void T *__restrict__ T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ jacinv
__global__ void const T *__restrict__ const T *__restrict__ dr
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ ds
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dt
__global__ void dirichlet_apply_scalar_kernel(const int *__restrict__ msk, T *__restrict__ x, const T g, const int m)

◆ CASE_1D

#define CASE_1D (   LX)
Value:
<<<nblcks, nthrds_1d, 0, stream>>>((real *) du, (real *) u, \
(real *) dr, (real *) ds, (real *) dt, \
(real *) dx, (real *) dy, (real *) dz, \
(real *) jacinv); \
double real

◆ CASE_KSTEP

#define CASE_KSTEP (   LX)
Value:
<<<nblcks, nthrds_kstep, 0, stream>>>((real *) du, (real *) u, \
(real *) dr, (real *) ds, (real *) dt, \
(real *) dx, (real *) dy, (real *) dz, \
(real *) jacinv); \

◆ CASE_LARGE

#define CASE_LARGE (   LX)
Value:
case LX: \
break

Function Documentation

◆ cuda_dudxyz()

void cuda_dudxyz ( void du,
void u,
void dr,
void ds,
void dt,
void dx,
void dy,
void dz,
void jacinv,
int nel,
int lx 
)

Fortran wrapper for device cuda derivative kernels

Definition at line 57 of file opr_dudxyz.cu.

Here is the call graph for this function:
Here is the caller graph for this function:

◆ tune_dudxyz()

template<const int >
int tune_dudxyz ( void du,
void u,
void dr,
void ds,
void dt,
void dx,
void dy,
void dz,
void jacinv,
int nel,
int lx 
)

Definition at line 142 of file opr_dudxyz.cu.

Here is the call graph for this function: