Neko 0.9.99
A portable framework for high-order spectral element flow simulations
|
Go to the source code of this file.
Functions | |
template<typename T, const int LX, const int CHUNKS>
__global__ void ax_helm_kernel_1d (T *__restrict__ w, const T *__restrict__ u, const T *__restrict__ dx, const T *__restrict__ dy, const T *__restrict__ dz, const T *__restrict__ dxt, const T *__restrict__ dyt, const T *__restrict__ dzt, const T *__restrict__ h1, const T *__restrict__ g11, const T *__restrict__ g22, const T *__restrict__ g33, const T *__restrict__ g12, const T *__restrict__ g13, const T *__restrict__ g23)
template<typename T , const int LX> | |
__global__ void | __launch_bounds__ (LX *LX, 3) ax_helm_kernel_kstep(T *__restrict__ w |
for (int k=0;k< LX;++k) | |
__syncthreads () | |
template<typename T>
__global__ void ax_helm_kernel_vector_part2 (T *__restrict__ au, T *__restrict__ av, T *__restrict__ aw, const T *__restrict__ u, const T *__restrict__ v, const T *__restrict__ w, const T *__restrict__ h2, const T *__restrict__ B, const int n)
Device kernel for axhelm that pads its shared-memory arrays to remove bank conflicts when LX is a power of 2.
__syncthreads ()
__global__ void ax_helm_kernel_1d (T *__restrict__ w,
                                   const T *__restrict__ u,
                                   const T *__restrict__ dx,
                                   const T *__restrict__ dy,
                                   const T *__restrict__ dz,
                                   const T *__restrict__ dxt,
                                   const T *__restrict__ dyt,
                                   const T *__restrict__ dzt,
                                   const T *__restrict__ h1,
                                   const T *__restrict__ g11,
                                   const T *__restrict__ g22,
                                   const T *__restrict__ g33,
                                   const T *__restrict__ g12,
                                   const T *__restrict__ g13,
                                   const T *__restrict__ g23)
Device kernels for Ax helm
Definition at line 42 of file ax_helm_kernel.h.
__global__ void ax_helm_kernel_vector_part2 (T *__restrict__ au,
                                             T *__restrict__ av,
                                             T *__restrict__ aw,
                                             const T *__restrict__ u,
                                             const T *__restrict__ v,
                                             const T *__restrict__ w,
                                             const T *__restrict__ h2,
                                             const T *__restrict__ B,
                                             const int n)
for ()
__global__ void T* __restrict__ av |
Definition at line 359 of file ax_helm_kernel.h.
__global__ void T* __restrict__ T* __restrict__ aw |
Definition at line 360 of file ax_helm_kernel.h.
__global__ void T* __restrict__ T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ dx |
Definition at line 152 of file ax_helm_kernel.h.
__global__ void T* __restrict__ T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ dy |
Definition at line 153 of file ax_helm_kernel.h.
__global__ void T* __restrict__ T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ dz |
Definition at line 154 of file ax_helm_kernel.h.
const int e = blockIdx.x |
Definition at line 175 of file ax_helm_kernel.h.
Definition at line 156 of file ax_helm_kernel.h.
Definition at line 159 of file ax_helm_kernel.h.
Definition at line 160 of file ax_helm_kernel.h.
Definition at line 157 of file ax_helm_kernel.h.
Definition at line 161 of file ax_helm_kernel.h.
Definition at line 158 of file ax_helm_kernel.h.
Definition at line 155 of file ax_helm_kernel.h.
const int i = threadIdx.x |
Definition at line 177 of file ax_helm_kernel.h.
Definition at line 176 of file ax_helm_kernel.h.
Definition at line 171 of file ax_helm_kernel.h.
T rut |
Definition at line 173 of file ax_helm_kernel.h.
Definition at line 395 of file ax_helm_kernel.h.
Definition at line 392 of file ax_helm_kernel.h.
T rvt |
Definition at line 400 of file ax_helm_kernel.h.
Definition at line 396 of file ax_helm_kernel.h.
Definition at line 172 of file ax_helm_kernel.h.
T rwt |
Definition at line 401 of file ax_helm_kernel.h.
Definition at line 397 of file ax_helm_kernel.h.
Definition at line 181 of file ax_helm_kernel.h.
Definition at line 164 of file ax_helm_kernel.h.
Definition at line 165 of file ax_helm_kernel.h.
__shared__ T shu[LX *(LX+1)] |
Definition at line 167 of file ax_helm_kernel.h.
__shared__ T shur[LX *LX] |
Definition at line 168 of file ax_helm_kernel.h.
__shared__ T shus[LX *(LX+1)] |
Definition at line 169 of file ax_helm_kernel.h.
__shared__ T shv[LX *(LX+1)] |
Definition at line 383 of file ax_helm_kernel.h.
__shared__ T shvr[LX *LX] |
Definition at line 384 of file ax_helm_kernel.h.
__shared__ T shvs[LX *(LX+1)] |
Definition at line 385 of file ax_helm_kernel.h.
__shared__ T shw[LX *(LX+1)] |
Definition at line 387 of file ax_helm_kernel.h.
__shared__ T shwr[LX *LX] |
Definition at line 388 of file ax_helm_kernel.h.
__shared__ T shws[LX *(LX+1)] |
Definition at line 389 of file ax_helm_kernel.h.
Definition at line 151 of file ax_helm_kernel.h.
Definition at line 362 of file ax_helm_kernel.h.
__global__ void T* __restrict__ T* __restrict__ const T* __restrict__ const T* __restrict__ const T* __restrict__ w |
Definition at line 363 of file ax_helm_kernel.h.