41 use,
intrinsic :: iso_c_binding
46 real(kind=
rp),
allocatable :: x(:,:)
47 character(len=NEKO_VARNAME_LEN) :: name =
""
48 type(c_ptr) :: x_d = c_null_ptr
49 integer,
private :: nrows = 0
50 integer,
private :: ncols = 0
51 integer,
private :: n = 0
91 integer,
intent(in) :: nrows
92 integer,
intent(in) :: ncols
93 character(len=*),
intent(in),
optional :: name
95 call m%alloc(nrows, ncols)
101 if (
present(name))
then
113 integer,
intent(in) :: nrows
114 integer,
intent(in) :: ncols
118 allocate(m%x(nrows, ncols))
135 if (
allocated(m%x))
then
139 if (c_associated(m%x_d))
then
165 integer,
intent(in) :: memdir
166 logical,
intent(in) :: sync
193 if (
allocated(m%x))
then
197 if (.not.
allocated(m%x))
then
202 allocate(m%x(m%nrows, m%ncols))
223 real(kind=
rp),
intent(in) :: s
225 if (.not.
allocated(m%x))
then
239 integer,
optional :: bcknd
244 &implemented on accelarators.")
257 integer :: indr(m%nrows), indc(m%ncols), ipiv(m%ncols)
258 real(kind=
xp) :: rmult(m%nrows), amx, tmp, piv, eps
259 integer :: i, j, k, ir, jc
261 if (.not. (m%ncols .eq. m%nrows))
then
262 call neko_error(
"Fatal error: trying to invert m matrix that is not &
272 if (ipiv(i) .ne. 1)
then
274 if (ipiv(j) .eq. 0)
then
275 if (abs(m%x(i, j)) .ge. amx)
then
280 else if (ipiv(j) .gt. 1)
then
286 ipiv(jc) = ipiv(jc) + 1
292 m%x(ir, j) = m%x(jc, j)
299 if (abs(m%x(jc, jc)) .lt. eps)
then
300 call neko_error(
"matrix_inverse error: small Gauss Jordan Piv")
302 piv = 1.0_xp/m%x(jc, jc)
305 m%x(jc, j) = m%x(jc, j)*piv
310 m%x(jc, j) = m%x(1 , j)
314 rmult(i) = m%x(i, jc)
320 m%x(i, j) = m%x(i, j) - rmult(i)*m%x(1, j)
326 m%x(jc, j) = m%x(1 , j)
332 do j = m%nrows, 1, -1
333 if (indr(j) .ne. indc(j))
then
335 tmp = m%x(i, indr(j))
336 m%x(i, indr(j)) = m%x(i, indc(j))
337 m%x(i, indc(j)) = tmp
Deassociate a Fortran array from a device pointer.
Map a Fortran array to a device (allocate and associate)
Copy data between host and device (or device and device)
Synchronize a device or stream.
subroutine, public device_copy(a_d, b_d, n, strm)
Copy a vector .
subroutine, public device_cfill(a_d, c, n, strm)
Set all elements to a constant c .
Device abstraction, common interface for various accelerators.
subroutine, public device_free(x_d)
Deallocate memory on the device.
subroutine matrix_free(m)
Deallocate a matrix.
subroutine matrix_bcknd_inverse(m, bcknd)
pure integer function matrix_ncols(m)
Returns the number of columns in the matrix.
subroutine matrix_assign_matrix(m, w)
Assignment .
subroutine cpu_matrix_inverse(m)
pure integer function matrix_nrows(m)
Returns the number of rows in the matrix.
subroutine matrix_init(m, nrows, ncols, name)
Initialise a matrix of size nrows*ncols.
pure integer function matrix_size(m)
Returns the number of entries in the matrix.
subroutine matrix_copy_from(m, memdir, sync)
Easy way to copy between host and device.
subroutine matrix_assign_scalar(m, s)
Assignment .
subroutine matrix_allocate(m, nrows, ncols)
Allocate a matrix of size nrows*ncols.
integer, parameter neko_bcknd_device
integer, parameter, public xp
integer, parameter, public rp
Global precision used in computations.
integer, parameter, public neko_varname_len