Neko  0.9.99
A portable framework for high-order spectral element flow simulations
opr_cdtp.hip File Reference
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include <hip/hip_runtime.h>
#include <device/device_config.h>
#include <device/hip/check.h>
#include "cdtp_kernel.h"
#include <common/neko_log.h>
Include dependency graph for opr_cdtp.hip:

Go to the source code of this file.

Macros

#define CASE_1D(LX)
 
#define CASE_KSTEP(LX)
 
#define CASE(LX)
 
#define CASE_LARGE(LX)
 

Functions

template<const int >
int tune_cdtp (void *dtx, void *x, void *dr, void *ds, void *dt, void *dxt, void *dyt, void *dzt, void *w3, int *nel, int *lx)
 
void hip_cdtp (void *dtx, void *x, void *dr, void *ds, void *dt, void *dxt, void *dyt, void *dzt, void *w3, int *nel, int *lx)
 

Macro Definition Documentation

◆ CASE

#define CASE (   LX)
Value:
case LX: \
if(autotune[LX] == 0 ) { \
autotune[LX]=tune_cdtp<LX>(dtx, x, \
dr, ds, dt, \
dxt, dyt, dzt, \
w3, nel, lx); \
} else if (autotune[LX] == 1 ) { \
CASE_1D(LX); \
} else if (autotune[LX] == 2 ) { \
CASE_KSTEP(LX); \
} \
break
__global__ void const T *__restrict__ const T *__restrict__ dr
Definition: cdtp_kernel.h:107
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ ds
Definition: cdtp_kernel.h:108
__global__ void const T *__restrict__ x
Definition: cdtp_kernel.h:106
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dt
Definition: cdtp_kernel.h:109
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ w3
Definition: cdtp_kernel.h:113
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dzt
Definition: cdtp_kernel.h:112
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dyt
Definition: cdtp_kernel.h:111
__global__ void const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ const T *__restrict__ dxt
Definition: cdtp_kernel.h:110

◆ CASE_1D

#define CASE_1D (   LX)
Value:
hipLaunchKernelGGL( HIP_KERNEL_NAME(cdtp_kernel_1d<real, LX, 1024> ), \
nblcks, nthrds_1d, 0, (hipStream_t) glb_cmd_queue, \
(real *) dtx, (real *) x, \
(real *) dr, (real *) ds, (real *) dt, \
(real *) dxt, (real *) dyt, (real *) dzt, \
(real *) w3); \
HIP_CHECK(hipGetLastError());
double real
Definition: device_config.h:12
void * glb_cmd_queue

◆ CASE_KSTEP

#define CASE_KSTEP (   LX)
Value:
hipLaunchKernelGGL( HIP_KERNEL_NAME(cdtp_kernel_kstep<real, LX> ), \
nblcks, nthrds_kstep, 0, (hipStream_t) glb_cmd_queue, \
(real *) dtx, (real *) x, \
(real *) dr, (real *) ds, (real *) dt, \
(real *) dxt, (real *) dyt, (real *) dzt, \
(real *) w3); \
HIP_CHECK(hipGetLastError());

◆ CASE_LARGE

#define CASE_LARGE (   LX)
Value:
case LX: \
CASE_KSTEP(LX); \
break

Function Documentation

◆ hip_cdtp()

void hip_cdtp ( void *  dtx,
void *  x,
void *  dr,
void *  ds,
void *  dt,
void *  dxt,
void *  dyt,
void *  dzt,
void *  w3,
int *  nel,
int *  lx 
)

Fortran wrapper for device hip \( D^T X \)

Definition at line 58 of file opr_cdtp.hip.

◆ tune_cdtp()

template<const int >
int tune_cdtp ( void *  dtx,
void *  x,
void *  dr,
void *  ds,
void *  dt,
void *  dxt,
void *  dyt,
void *  dzt,
void *  w3,
int *  nel,
int *  lx 
)

Definition at line 144 of file opr_cdtp.hip.

Here is the call graph for this function: