42 use,
intrinsic :: iso_c_binding, only : c_ptr, c_int
55 dx_d, dy_d, dz_d, dxt_d, dyt_d, dzt_d, &
56 h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d, nelv, lx) &
57 bind(c, name='hip_ax_helm')
! Interface body for the C routine bound as 'hip_ax_helm'.
! Every *_d argument is a C pointer passed by value; nelv and lx carry no
! value attribute, so they are passed by reference.
58 use, intrinsic :: iso_c_binding
59 type(c_ptr), value :: w_d, u_d
60 type(c_ptr), value :: dx_d, dy_d, dz_d
61 type(c_ptr), value :: dxt_d, dyt_d, dzt_d
62 type(c_ptr), value :: h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d
! Declare the dummy argument nelv itself. An interface body does not inherit
! the host's implicit none, so an undeclared nelv silently falls back to
! implicit default-integer typing instead of integer(c_int).
63 integer(c_int) :: nelv, lx
69 dx_d, dy_d, dz_d, dxt_d, dyt_d, dzt_d,&
70 h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d, nelv, lx) &
71 bind(c, name='hip_ax_helm_vector')
! Interface body for the C routine bound as 'hip_ax_helm_vector'.
! Three result pointers (au_d, av_d, aw_d) and three input pointers
! (u_d, v_d, w_d) are declared; all pointers are passed by value, while
! nelv and lx carry no value attribute and are passed by reference.
72 use, intrinsic :: iso_c_binding
73 type(c_ptr), value :: au_d, av_d, aw_d
74 type(c_ptr), value :: u_d, v_d, w_d
75 type(c_ptr), value :: dx_d, dy_d, dz_d
76 type(c_ptr), value :: dxt_d, dyt_d, dzt_d
77 type(c_ptr), value :: h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d
! Declare the dummy argument nelv itself. An interface body does not inherit
! the host's implicit none, so an undeclared nelv silently falls back to
! implicit default-integer typing instead of integer(c_int).
78 integer(c_int) :: nelv, lx
84 h2_d, B_d, n) bind(c, name='hip_ax_helm_vector_part2')
! Interface body for the C routine bound as 'hip_ax_helm_vector_part2'.
! All arguments declared below are C pointers passed by value.
! NOTE(review): the declaration of the dummy argument n is not visible in
! this excerpt (the listing jumps from line 88 to 95) - confirm it is
! declared integer(c_int); an undeclared n would be implicitly typed.
85 use,
intrinsic :: iso_c_binding
86 type(c_ptr),
value :: au_d, av_d, aw_d
87 type(c_ptr),
value :: u_d, v_d, w_d
88 type(c_ptr),
value :: h2_d, B_d
95 dx_d, dy_d, dz_d, dxt_d, dyt_d, dzt_d,&
96 h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d, nelv, lx) &
97 bind(c, name='cuda_ax_helm')
! Interface body for the C routine bound as 'cuda_ax_helm'.
! Every *_d argument is a C pointer passed by value (void * on the C side);
! nelv and lx carry no value attribute, so they are passed by reference,
! matching the int * parameters of the C prototype.
98 use, intrinsic :: iso_c_binding
99 type(c_ptr), value :: w_d, u_d
100 type(c_ptr), value :: dx_d, dy_d, dz_d
101 type(c_ptr), value :: dxt_d, dyt_d, dzt_d
102 type(c_ptr), value :: h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d
! Declare the dummy argument nelv itself. An interface body does not inherit
! the host's implicit none, so an undeclared nelv silently falls back to
! implicit default-integer typing instead of integer(c_int).
103 integer(c_int) :: nelv, lx
109 dx_d, dy_d, dz_d, dxt_d, dyt_d, dzt_d,&
110 h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d, nelv, lx) &
111 bind(c, name='cuda_ax_helm_vector')
! Interface body for the C routine bound as 'cuda_ax_helm_vector'.
! Three result pointers (au_d, av_d, aw_d) and three input pointers
! (u_d, v_d, w_d) are declared; all pointers are passed by value (void * on
! the C side), while nelv and lx are passed by reference, matching the
! int * parameters of the C prototype.
112 use, intrinsic :: iso_c_binding
113 type(c_ptr), value :: au_d, av_d, aw_d
114 type(c_ptr), value :: u_d, v_d, w_d
115 type(c_ptr), value :: dx_d, dy_d, dz_d
116 type(c_ptr), value :: dxt_d, dyt_d, dzt_d
117 type(c_ptr), value :: h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d
! Declare the dummy argument nelv itself. An interface body does not inherit
! the host's implicit none, so an undeclared nelv silently falls back to
! implicit default-integer typing instead of integer(c_int).
118 integer(c_int) :: nelv, lx
124 h2_d, B_d, n) bind(c, name='cuda_ax_helm_vector_part2')
! Interface body for the C routine bound as 'cuda_ax_helm_vector_part2'.
! All arguments declared below are C pointers passed by value (void * on the
! C side).
! NOTE(review): the C prototype takes int *n, but the Fortran declaration of
! n is not visible in this excerpt (the listing jumps from line 128 to 135) -
! confirm it is declared integer(c_int) without the value attribute.
125 use,
intrinsic :: iso_c_binding
126 type(c_ptr),
value :: au_d, av_d, aw_d
127 type(c_ptr),
value :: u_d, v_d, w_d
128 type(c_ptr),
value :: h2_d, B_d
135 dx_d, dy_d, dz_d, dxt_d, dyt_d, dzt_d, &
136 h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d, nelv, lx) &
137 bind(c, name='opencl_ax_helm')
! Interface body for the C routine bound as 'opencl_ax_helm'.
! Every *_d argument is a C pointer passed by value (void * on the C side);
! nelv and lx carry no value attribute, so they are passed by reference,
! matching the int * parameters of the C prototype.
138 use, intrinsic :: iso_c_binding
139 type(c_ptr), value :: w_d, u_d
140 type(c_ptr), value :: dx_d, dy_d, dz_d
141 type(c_ptr), value :: dxt_d, dyt_d, dzt_d
142 type(c_ptr), value :: h1_d, g11_d, g22_d, g33_d, g12_d, g13_d, g23_d
! Declare the dummy argument nelv itself. An interface body does not inherit
! the host's implicit none, so an undeclared nelv silently falls back to
! implicit default-integer typing instead of integer(c_int).
143 integer(c_int) :: nelv, lx
! Declarations and backend calls of ax_helm_device_compute(w, u, coef, msh, xh).
! The subroutine statement, the backend selection logic and the end statement
! are not visible in this excerpt.
151 type(
mesh_t),
intent(inout) :: msh
152 type(
space_t),
intent(inout) :: Xh
153 type(
coef_t),
intent(inout) :: coef
! w and u are both dimensioned (lx, ly, lz, nelv) from the space and the mesh.
154 real(kind=
rp),
intent(inout) :: w(xh%lx, xh%ly, xh%lz, msh%nelv)
155 real(kind=
rp),
intent(inout) :: u(xh%lx, xh%ly, xh%lz, msh%nelv)
! C pointers handed to the backend routines in place of u and w.
! NOTE(review): how u_d and w_d are obtained is not visible here (presumably
! a device-pointer lookup for u and w) - confirm.
156 type(c_ptr) :: u_d, w_d
! HIP backend call: passes the *_d members of Xh (dx..dzt) and of coef (h1 and
! the six G factors). The trailing arguments are cut off in this excerpt.
162 call hip_ax_helm(w_d, u_d, xh%dx_d, xh%dy_d, xh%dz_d, &
163 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
164 coef%G11_d, coef%G22_d, coef%G33_d, &
165 coef%G12_d, coef%G13_d, coef%G23_d, &
! CUDA backend call with the same argument list.
168 call cuda_ax_helm(w_d, u_d, xh%dx_d, xh%dy_d, xh%dz_d, &
169 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
170 coef%G11_d, coef%G22_d, coef%G33_d, &
171 coef%G12_d, coef%G13_d, coef%G23_d, &
! Tail of a third backend call whose first line is missing from this excerpt.
! NOTE(review): presumably the opencl_ax_helm call - confirm.
175 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
176 coef%G11_d, coef%G22_d, coef%G33_d, &
177 coef%G12_d, coef%G13_d, coef%G23_d, &
! Combines w_d with coef%h2_d, coef%B_d and u_d over coef%dof%size() entries.
! NOTE(review): presumably w = w + h2 * B * u; any condition guarding this
! call lies outside the visible lines - confirm both.
182 call device_addcol4(w_d ,coef%h2_d, coef%B_d, u_d, coef%dof%size())
188 u, v, w, coef, msh, Xh)
! Declarations and backend calls of ax_helm_device_compute_vector. Only the
! tail of the argument list is visible above; the backend selection logic,
! the first line of every backend call and the end statement are missing
! from this excerpt.
190 type(
space_t),
intent(inout) :: Xh
191 type(
mesh_t),
intent(inout) :: msh
192 type(
coef_t),
intent(inout) :: coef
! au, av, aw and u, v, w are all dimensioned (lx, ly, lz, nelv) from the
! space and the mesh.
193 real(kind=
rp),
intent(inout) :: au(xh%lx, xh%ly, xh%lz, msh%nelv)
194 real(kind=
rp),
intent(inout) :: av(xh%lx, xh%ly, xh%lz, msh%nelv)
195 real(kind=
rp),
intent(inout) :: aw(xh%lx, xh%ly, xh%lz, msh%nelv)
196 real(kind=
rp),
intent(inout) :: u(xh%lx, xh%ly, xh%lz, msh%nelv)
197 real(kind=
rp),
intent(inout) :: v(xh%lx, xh%ly, xh%lz, msh%nelv)
198 real(kind=
rp),
intent(inout) :: w(xh%lx, xh%ly, xh%lz, msh%nelv)
! C pointers handed to the backend routines in place of the six arrays.
! NOTE(review): how these pointers are obtained is not visible here - confirm.
199 type(c_ptr) :: u_d, v_d, w_d
200 type(c_ptr) :: au_d, av_d, aw_d
! Argument tails of two backend calls whose first lines are missing. The
! visible arguments follow the order of the *_ax_helm_vector interfaces.
! NOTE(review): presumably the hip_ax_helm_vector and cuda_ax_helm_vector
! calls - confirm.
212 xh%dx_d, xh%dy_d, xh%dz_d, xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
213 coef%G11_d, coef%G22_d, coef%G33_d, &
214 coef%G12_d, coef%G13_d, coef%G23_d, &
218 xh%dx_d, xh%dy_d, xh%dz_d, xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
219 coef%G11_d, coef%G22_d, coef%G33_d, &
220 coef%G12_d, coef%G13_d, coef%G23_d, &
! Argument tails of three further backend calls whose first lines are missing.
! NOTE(review): presumably one scalar backend call per component - confirm.
224 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
225 coef%G11_d, coef%G22_d, coef%G33_d, &
226 coef%G12_d, coef%G13_d, coef%G23_d, &
229 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
230 coef%G11_d, coef%G22_d, coef%G33_d, &
231 coef%G12_d, coef%G13_d, coef%G23_d, &
234 xh%dxt_d, xh%dyt_d, xh%dzt_d, coef%h1_d, &
235 coef%G11_d, coef%G22_d, coef%G33_d, &
236 coef%G12_d, coef%G13_d, coef%G23_d, &
! Argument tails of two calls ending in (h2_d, B_d, n), the same trailing
! arguments as the *_ax_helm_vector_part2 interfaces.
! NOTE(review): presumably the HIP and CUDA part2 calls - confirm.
243 coef%h2_d, coef%B_d, coef%dof%size())
246 coef%h2_d, coef%B_d, coef%dof%size())
! One device_addcol4 call per component, each combining the result pointer
! with coef%h2_d, coef%B_d and the matching input pointer.
! NOTE(review): presumably a = a + h2 * B * x per component; which backend
! path reaches these calls is not visible - confirm.
248 call device_addcol4(au_d ,coef%h2_d, coef%B_d, u_d, coef%dof%size())
249 call device_addcol4(av_d ,coef%h2_d, coef%B_d, v_d, coef%dof%size())
250 call device_addcol4(aw_d ,coef%h2_d, coef%B_d, w_d, coef%dof%size())
void opencl_ax_helm(void *w, void *u, void *dx, void *dy, void *dz, void *dxt, void *dyt, void *dzt, void *h1, void *g11, void *g22, void *g33, void *g12, void *g13, void *g23, int *nelv, int *lx)
void cuda_ax_helm_vector_part2(void *au, void *av, void *aw, void *u, void *v, void *w, void *h2, void *B, int *n)
void cuda_ax_helm(void *w, void *u, void *dx, void *dy, void *dz, void *dxt, void *dyt, void *dzt, void *h1, void *g11, void *g22, void *g33, void *g12, void *g13, void *g23, int *nelv, int *lx)
void cuda_ax_helm_vector(void *au, void *av, void *aw, void *u, void *v, void *w, void *dx, void *dy, void *dz, void *dxt, void *dyt, void *dzt, void *h1, void *g11, void *g22, void *g33, void *g12, void *g13, void *g23, int *nelv, int *lx)
Return the device pointer for an associated Fortran array.
subroutine ax_helm_device_compute(w, u, coef, msh, xh)
subroutine ax_helm_device_compute_vector(this, au, av, aw, u, v, w, coef, msh, xh)
subroutine, public device_addcol4(a_d, b_d, c_d, d_d, n)
Returns $a = a + b \cdot c \cdot d$.
Device abstraction, common interface for various accelerators.
integer, parameter, public rp
Global precision used in computations.
Defines a function space.
Matrix-vector product for a Helmholtz problem.
Coefficients defined on a given (mesh, $X_h$) tuple. Arrays use indices (i,j,k,e): element e,...
The function space for the SEM solution fields.