#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include "dudxyz_kernel.h"
#include <device/device_config.h>
#include <device/cuda/check.h>
#include <common/neko_log.h>

Macros
#define	CASE_1D(LX)

#define	CASE_KSTEP(LX)

#define	CASE(LX)

#define	CASE_LARGE(LX)

Functions
template<const int >
int	tune_dudxyz (void du, void u, void dr, void ds, void dt, void dx, void dy, void dz, void jacinv, int nel, int *lx)

void	cuda_dudxyz (void du, void u, void dr, void ds, void dt, void dx, void dy, void dz, void jacinv, int nel, int *lx)

Macro Definition Documentation

◆ CASE

#define CASE ( LX )

Value:

    case LX:                                                                    \
      if(autotune[LX] == 0 ) {                                                  \
        autotune[LX]=tune_dudxyz<LX>(du, u,                                     \
                                     dr, ds, dt,                                \
                                     dx, dy, dz,                                \
                                     jacinv, nel, lx);                          \
      } else if (autotune[LX] == 1 ) {                                          \
        CASE_1D(LX);                                                            \
      } else if (autotune[LX] == 2 ) {                                          \
        CASE_KSTEP(LX);                                                         \
      }                                                                         \
      break

◆ CASE_1D

#define CASE_1D ( LX )

Value:

    dudxyz_kernel_1d<real, LX, 1024>                                            \
      <<<nblcks, nthrds_1d, 0, stream>>>((real *) du, (real *) u,               \
                              (real *) dr, (real *) ds, (real *) dt,            \
                              (real *) dx, (real *) dy, (real *) dz,            \
                              (real *) jacinv);                                 \
    CUDA_CHECK(cudaGetLastError());

◆ CASE_KSTEP

#define CASE_KSTEP ( LX )

Value:

    dudxyz_kernel_kstep<real, LX>                                               \
      <<<nblcks, nthrds_kstep, 0, stream>>>((real *) du, (real *) u,            \
                                (real *) dr, (real *) ds, (real *) dt,          \
                                (real *) dx, (real *) dy, (real *) dz,          \
                                (real *) jacinv);                               \
      CUDA_CHECK(cudaGetLastError());

◆ CASE_LARGE

#define CASE_LARGE ( LX )

Value:

    case LX:                                                                    \
      CASE_KSTEP(LX);                                                           \
      break

Function Documentation

◆ cuda_dudxyz()

void cuda_dudxyz	(	void *	du,
		void *	u,
		void *	dr,
		void *	ds,
		void *	dt,
		void *	dx,
		void *	dy,
		void *	dz,
		void *	jacinv,
		int *	nel,
		int *	lx
	)

Fortran wrapper for device cuda derivative kernels

Definition at line 57 of file opr_dudxyz.cu.

Here is the call graph for this function:

Here is the caller graph for this function:

◆ tune_dudxyz()

template<const int >

int tune_dudxyz	(	void *	du,
		void *	u,
		void *	dr,
		void *	ds,
		void *	dt,
		void *	dx,
		void *	dy,
		void *	dz,
		void *	jacinv,
		int *	nel,
		int *	lx
	)

Definition at line 142 of file opr_dudxyz.cu.

Here is the call graph for this function:

Macros

Functions

Macro Definition Documentation

◆ CASE

◆ CASE_1D

◆ CASE_KSTEP

◆ CASE_LARGE

Function Documentation

◆ cuda_dudxyz()

◆ tune_dudxyz()