47 bind(c, name =
'cuda_masked_copy')
48 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
49 type(c_ptr),
value :: a_d, b_d, mask_d, strm
50 integer(c_int) :: n, n_mask
54 bind(c, name =
'cuda_masked_gather_copy')
55 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
56 type(c_ptr),
value :: a_d, b_d, mask_d, strm
57 integer(c_int) :: n, n_mask
61 strm) bind(c, name = 'cuda_masked_gather_copy_aligned')
62 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
63 type(c_ptr),
value :: a_d, b_d, mask_d, strm
64 integer(c_int) :: n, n_mask
68 bind(c, name =
'cuda_masked_scatter_copy')
69 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
70 type(c_ptr),
value :: a_d, b_d, mask_d, strm
71 integer(c_int) :: n, n_mask
75 bind(c, name =
'cuda_masked_atomic_reduction')
76 use,
intrinsic :: iso_c_binding, only : c_ptr, c_int
77 type(c_ptr),
value :: a_d, b_d, mask_d, strm
78 integer(c_int) :: n, m
82 bind(c, name =
'cuda_cfill_mask')
83 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
85 type(c_ptr),
value :: a_d, strm
88 type(c_ptr),
value :: mask_d
89 integer(c_int) :: n_mask
173 bind(c, name =
'cuda_add4')
174 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
176 type(c_ptr),
value :: a_d, b_d, c_d, d_d, strm
208 bind(c, name =
'cuda_add3s2')
209 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
211 type(c_ptr),
value :: a_d, b_d, c_d, strm
217 bind(c, name =
'cuda_add4s3')
218 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
220 type(c_ptr),
value :: a_d, b_d, c_d, d_d, strm
221 real(c_rp) :: c1, c2, c3
225 subroutine cuda_add5s4(a_d, b_d, c_d, d_d, e_d, c1, c2, c3, c4, n, strm) &
226 bind(c, name =
'cuda_add5s4')
227 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
229 type(c_ptr),
value :: a_d, b_d, c_d, d_d, e_d, strm
230 real(c_rp) :: c1, c2, c3, c4
305 bind(c, name =
'cuda_addcol4')
306 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
307 type(c_ptr),
value :: a_d, b_d, c_d, d_d, strm
320 subroutine cuda_vdot3(dot_d, u1_d, u2_d, u3_d, v1_d, v2_d, v3_d, n, strm) &
321 bind(c, name =
'cuda_vdot3')
322 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
323 type(c_ptr),
value :: dot_d, u1_d, u2_d, u3_d, v1_d, v2_d, v3_d, strm
328 w1_d, w2_d, w3_d, n, strm) &
329 bind(c, name =
'cuda_vcross')
330 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
331 type(c_ptr),
value :: u1_d, u2_d, u3_d
332 type(c_ptr),
value :: v1_d, v2_d, v3_d
333 type(c_ptr),
value :: w1_d, w2_d, w3_d
334 type(c_ptr),
value :: strm
363 bind(c, name =
'cuda_glsc3_many')
364 use,
intrinsic :: iso_c_binding, only : c_int, c_ptr
366 type(c_ptr),
value :: w_d, v_d_d, mult_d, strm
367 integer(c_int) :: j, n