dc/dcb/matrix_8f90_source.html

! Copyright (c) 2024, The Neko Authors

! All rights reserved.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

!   * Redistributions of source code must retain the above copyright

!     notice, this list of conditions and the following disclaimer.

!

!   * Redistributions in binary form must reproduce the above

!     copyright notice, this list of conditions and the following

!     disclaimer in the documentation and/or other materials provided

!     with the distribution.

!

!   * Neither the name of the authors nor the names of its

!     contributors may be used to endorse or promote products derived

!     from this software without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

! POSSIBILITY OF SUCH DAMAGE.

!

module matrix

  use neko_config, only: neko_bcknd_device

  use math, only: sub3, chsign, add3, cmult2, cadd2, copy

  use num_types, only: rp

  use device, only: device_map, device_free, c_ptr, c_null_ptr

  use device_math, only: device_copy, device_cfill, device_cmult, &

       device_sub3, device_cmult2, device_add3, device_cadd2

  use utils, only: neko_error

  use, intrinsic :: iso_c_binding

  implicit none

  private


  !> Dense two-dimensional matrix of `rp` reals with an optional device pointer.
  !! Arithmetic operators return new matrices; the device routines are used
  !! whenever `neko_bcknd_device` equals 1, the host routines otherwise.
  type, public ::  matrix_t

     !> Matrix entries on the host, allocated as (nrows, ncols).
     real(kind=rp), allocatable :: x(:,:)

     !> Device pointer mapped to `x` by `device_map` on device backends.
     type(c_ptr) :: x_d = c_null_ptr

     !> Number of rows.
     integer :: nrows  = 0

     !> Number of columns.
     integer :: ncols  = 0

     !> Total number of entries, nrows*ncols.
     integer :: n = 0

   contains

     !> Allocate an nrows x ncols matrix and set all entries to zero.
     procedure, pass(m) :: init => matrix_init

     !> Release host (and device) storage and reset the sizes to zero.
     procedure, pass(m) :: free => matrix_free

     !> Return the total number of entries `n`.
     procedure, pass(m) :: size => matrix_size

     !> Assignment from another matrix, m = w.
     procedure, pass(m) :: matrix_assign_matrix

     !> Assignment of a scalar to every entry, m = s.
     procedure, pass(m) :: matrix_assign_scalar

     !> Matrix-matrix addition, m + b.
     procedure, pass(m) :: matrix_add_matrix

     !> Matrix-scalar addition, m + c.
     procedure, pass(m) :: matrix_add_scalar_left

     !> Scalar-matrix addition, c + m.
     procedure, pass(m) :: matrix_add_scalar_right

     !> Matrix-matrix subtraction, m - b.
     procedure, pass(m) :: matrix_sub_matrix

     !> Matrix-scalar subtraction, m - c.
     procedure, pass(m) :: matrix_sub_scalar_left

     !> Scalar-matrix subtraction, c - m.
     procedure, pass(m) :: matrix_sub_scalar_right

     !> Matrix-scalar multiplication, m * c.
     procedure, pass(m) :: matrix_cmult_left

     !> Scalar-matrix multiplication, c * m.
     procedure, pass(m) :: matrix_cmult_right

     !> In-place inverse; dispatches on the backend (host only at present).
     procedure, pass(m) :: inverse => matrix_bcknd_inverse


     !> Defined assignment from a matrix or a scalar.
     generic :: assignment(=) => matrix_assign_matrix, &

          matrix_assign_scalar

     !> Element-wise addition with a matrix or a scalar on either side.
     generic :: operator(+) => matrix_add_matrix, &

          matrix_add_scalar_left, matrix_add_scalar_right

     !> Element-wise subtraction with a matrix or a scalar on either side.
     generic :: operator(-) => matrix_sub_matrix, &

          matrix_sub_scalar_left, matrix_sub_scalar_right

     !> Multiplication by a scalar on either side.
     generic :: operator(*) => matrix_cmult_left, matrix_cmult_right

  end type matrix_t

  type, public ::  matrix_t …


contains


  !> Initialise a matrix of size `nrows` x `ncols` with all entries zero.
  !! Whatever `m` held before is released first.
  !! @param m Matrix to initialise.
  !! @param nrows Number of rows.
  !! @param ncols Number of columns.
  subroutine matrix_init(m, nrows, ncols)
    class(matrix_t), intent(inout) :: m
    integer, intent(in) :: nrows
    integer, intent(in) :: ncols

    ! Drop any previous host/device storage so re-initialisation is safe
    call m%free()

    m%nrows = nrows
    m%ncols = ncols
    m%n = nrows*ncols

    allocate(m%x(nrows, ncols))
    m%x = 0.0_rp

    ! On device backends, map the host array and zero the device data too
    if (neko_bcknd_device .eq. 1) then
       call device_map(m%x, m%x_d, m%n)
       call device_cfill(m%x_d, 0.0_rp, m%n)
    end if

  end subroutine matrix_init


  !> Deallocate a matrix: release the host array, free the device pointer
  !! if one is associated, and reset all sizes to zero.
  !! @param m Matrix to release.
  subroutine matrix_free(m)
    class(matrix_t), intent(inout) :: m

    if (allocated(m%x)) deallocate(m%x)

    if (c_associated(m%x_d)) call device_free(m%x_d)

    m%n = 0
    m%nrows = 0
    m%ncols = 0

  end subroutine matrix_free


  !> Returns the number of entries in the matrix.
  !! The matrix is only read, so the passed object is `intent(in)`; this
  !! lets `size()` be called on matrices received as `intent(in)`.
  !! @param m Matrix to query.
  !! @return s Total number of entries, `m%n`.
  pure function matrix_size(m) result(s)
    class(matrix_t), intent(in) :: m
    integer :: s

    s = m%n

  end function matrix_size


  !> Assignment \f$ m = w \f$.
  !! Existing storage of `m` is reused when it already has the shape of `w`
  !! (and, on device backends, an associated device pointer); otherwise `m`
  !! is released and reallocated. On device backends only the device data
  !! is copied, on the host the entries of `x` are copied.
  !! @param m Matrix being assigned to.
  !! @param w Matrix to copy from. If `w` holds no data, `m` is released.
  subroutine matrix_assign_matrix(m, w)
    class(matrix_t), intent(inout) :: m
    type(matrix_t), intent(in) :: w
    logical :: reuse

    ! Nothing to copy from: leave m empty instead of reading unallocated data
    if (.not. allocated(w%x)) then
       call m%free()
       return
    end if

    ! Decide whether the current storage of m can hold w as it is
    reuse = .false.
    if (allocated(m%x)) then
       reuse = (size(m%x, 1) .eq. w%nrows) .and. &
            (size(m%x, 2) .eq. w%ncols)
       if (neko_bcknd_device .eq. 1) then
          reuse = reuse .and. c_associated(m%x_d)
       end if
    end if

    if (.not. reuse) then
       call m%free()
       allocate(m%x(w%nrows, w%ncols))

       if (neko_bcknd_device .eq. 1) then
          call device_map(m%x, m%x_d, w%n)
       end if
    end if

    m%nrows = w%nrows
    m%ncols = w%ncols
    m%n = w%n

    if (neko_bcknd_device .eq. 1) then
       call device_copy(m%x_d, w%x_d, m%n)
    else
       m%x = w%x
    end if

  end subroutine matrix_assign_matrix


  !> Assignment \f$ m = s \f$: set every entry of an allocated matrix to `s`.
  !! @param m Matrix to fill; must already be allocated.
  !! @param s Scalar value written to all entries.
  subroutine matrix_assign_scalar(m, s)
    class(matrix_t), intent(inout) :: m
    real(kind=rp), intent(in) :: s

    if (.not. allocated(m%x)) call neko_error('matrix not allocated')

    ! Fill on whichever side the active backend works on
    if (neko_bcknd_device .ne. 1) then
       m%x = s
    else
       call device_cfill(m%x_d, s, m%n)
    end if

  end subroutine matrix_assign_scalar


  !> Matrix-matrix addition \f$ v = m + b \f$.
  !! @param m Left operand.
  !! @param b Right operand; must have the same shape as `m`.
  !! @return v Newly allocated matrix holding the sum.
  function matrix_add_matrix(m, b) result(v)
    class(matrix_t), intent(in) :: m, b
    type(matrix_t) :: v

    if (.not. (m%nrows .eq. b%nrows .and. m%ncols .eq. b%ncols)) then
       call neko_error("Matrices must be the same size!")
    end if

    ! The result takes the shape of the operands
    v%nrows = m%nrows
    v%ncols = m%ncols
    v%n = m%n
    allocate(v%x(m%nrows, m%ncols))

    if (neko_bcknd_device .ne. 1) then
       call add3(v%x, m%x, b%x, v%n)
    else
       call device_map(v%x, v%x_d, v%n)
       call device_add3(v%x_d, m%x_d, b%x_d, v%n)
    end if

  end function matrix_add_matrix


  !> Matrix-scalar addition \f$ v = m + c \f$.
  !! @param m Matrix operand.
  !! @param c Scalar added to every entry.
  !! @return v Newly allocated matrix holding the result.
  function matrix_add_scalar_left(m, c) result(v)
    class(matrix_t), intent(in) :: m
    real(kind=rp), intent(in) :: c
    type(matrix_t) :: v

    ! The result takes the shape of the matrix operand
    v%nrows = m%nrows
    v%ncols = m%ncols
    v%n = m%n
    allocate(v%x(m%nrows, m%ncols))

    if (neko_bcknd_device .ne. 1) then
       call cadd2(v%x, m%x, c, v%n)
    else
       call device_map(v%x, v%x_d, v%n)
       call device_cadd2(v%x_d, m%x_d, c, v%n)
    end if

  end function matrix_add_scalar_left


  !> Scalar-matrix addition \f$ v = c + m \f$.
  !! The sum is written straight into the result. Going through
  !! `v = matrix_add_scalar_left(m, c)` would create a temporary matrix
  !! whose device mapping is never released (the type has no finaliser)
  !! and would copy the data once more.
  !! @param c Scalar added to every entry.
  !! @param m Matrix operand.
  !! @return v Newly allocated matrix holding the result.
  function matrix_add_scalar_right(c, m) result(v)
    real(kind=rp), intent(in) :: c
    class(matrix_t), intent(in) :: m
    type(matrix_t) :: v

    v%n = m%n
    v%nrows = m%nrows
    v%ncols = m%ncols
    allocate(v%x(v%nrows, v%ncols))

    if (neko_bcknd_device .eq. 1) then
       call device_map(v%x, v%x_d, v%n)
       call device_cadd2(v%x_d, m%x_d, c, v%n)
    else
       call cadd2(v%x, m%x, c, v%n)
    end if

  end function matrix_add_scalar_right


  !> Matrix-matrix subtraction \f$ v = m - b \f$.
  !! @param m Left operand.
  !! @param b Right operand; must have the same shape as `m`.
  !! @return v Newly allocated matrix holding the difference.
  function matrix_sub_matrix(m, b) result(v)
    class(matrix_t), intent(in) :: m, b
    type(matrix_t) :: v

    if (.not. (m%nrows .eq. b%nrows .and. m%ncols .eq. b%ncols)) then
       call neko_error("Matrices must be the same size!")
    end if

    ! The result takes the shape of the operands
    v%nrows = m%nrows
    v%ncols = m%ncols
    v%n = m%n
    allocate(v%x(m%nrows, m%ncols))

    if (neko_bcknd_device .ne. 1) then
       call sub3(v%x, m%x, b%x, v%n)
    else
       call device_map(v%x, v%x_d, v%n)
       call device_sub3(v%x_d, m%x_d, b%x_d, v%n)
    end if

  end function matrix_sub_matrix


  !> Matrix-scalar subtraction \f$ v = m - c \f$, computed by adding `-c`
  !! to every entry.
  !! @param m Matrix operand.
  !! @param c Scalar subtracted from every entry.
  !! @return v Newly allocated matrix holding the result.
  function matrix_sub_scalar_left(m, c) result(v)
    class(matrix_t), intent(in) :: m
    real(kind=rp), intent(in) :: c
    type(matrix_t) :: v

    ! The result takes the shape of the matrix operand
    v%nrows = m%nrows
    v%ncols = m%ncols
    v%n = m%n
    allocate(v%x(m%nrows, m%ncols))

    if (neko_bcknd_device .ne. 1) then
       call cadd2(v%x, m%x, -c, v%n)
    else
       call device_map(v%x, v%x_d, v%n)
       call device_cadd2(v%x_d, m%x_d, -c, v%n)
    end if

  end function matrix_sub_scalar_left


  !> Scalar-matrix subtraction \f$ v = c - m \f$.
  !! Evaluated as \f$ -(m - c) \f$: `-c` is added to every entry and the
  !! sign of the result is flipped. The work is done directly in the result
  !! rather than via `v = matrix_sub_scalar_left(m, c)`, which would create
  !! a temporary matrix whose device mapping is never released (the type
  !! has no finaliser) and copy the data once more.
  !! @param c Scalar operand.
  !! @param m Matrix subtracted from the scalar.
  !! @return v Newly allocated matrix holding the result.
  function matrix_sub_scalar_right(c, m) result(v)
    real(kind=rp), intent(in) :: c
    class(matrix_t), intent(in) :: m
    type(matrix_t) :: v

    v%n = m%n
    v%nrows = m%nrows
    v%ncols = m%ncols
    allocate(v%x(v%nrows, v%ncols))

    if (neko_bcknd_device .eq. 1) then
       call device_map(v%x, v%x_d, v%n)
       call device_cadd2(v%x_d, m%x_d, -1.0_rp*c, v%n)
       call device_cmult(v%x_d, -1.0_rp, v%n)
    else
       call cadd2(v%x, m%x, -1.0_rp*c, v%n)
       call chsign(v%x, v%n)
    end if

  end function matrix_sub_scalar_right


  !> Matrix-scalar multiplication \f$ v = m c \f$.
  !! @param m Matrix operand.
  !! @param c Scalar factor applied to every entry.
  !! @return v Newly allocated matrix holding the result.
  function matrix_cmult_left(m, c) result(v)
    class(matrix_t), intent(in) :: m
    real(kind=rp), intent(in) :: c
    type(matrix_t) :: v

    ! The result takes the shape of the matrix operand
    v%nrows = m%nrows
    v%ncols = m%ncols
    v%n = m%n
    allocate(v%x(m%nrows, m%ncols))

    if (neko_bcknd_device .ne. 1) then
       call cmult2(v%x, m%x, c, v%n)
    else
       call device_map(v%x, v%x_d, v%n)
       call device_cmult2(v%x_d, m%x_d, c, v%n)
    end if

  end function matrix_cmult_left


  !> Scalar-matrix multiplication \f$ v = c m \f$.
  !! The product is written straight into the result. Going through
  !! `v = matrix_cmult_left(m, c)` would create a temporary matrix whose
  !! device mapping is never released (the type has no finaliser) and would
  !! copy the data once more.
  !! @param c Scalar factor applied to every entry.
  !! @param m Matrix operand.
  !! @return v Newly allocated matrix holding the result.
  function matrix_cmult_right(c, m) result(v)
    real(kind=rp), intent(in) :: c
    class(matrix_t), intent(in) :: m
    type(matrix_t) :: v

    v%n = m%n
    v%nrows = m%nrows
    v%ncols = m%ncols
    allocate(v%x(v%nrows, v%ncols))

    if (neko_bcknd_device .eq. 1) then
       call device_map(v%x, v%x_d, v%n)
       call device_cmult2(v%x_d, m%x_d, c, v%n)
    else
       call cmult2(v%x, m%x, c, v%n)
    end if

  end function matrix_cmult_right


  !> Invert the matrix in place, dispatching on the active backend.
  !! Only the host implementation exists; on device backends the routine
  !! reports an error through `neko_error`.
  !! @param m Matrix to invert; overwritten with its inverse.
  subroutine matrix_bcknd_inverse(m)
    class(matrix_t), intent(inout) :: m

    if (neko_bcknd_device .eq. 1) then
       call neko_error("matrix_bcknd_inverse not implemented on accelerators.")
    else
       call cpu_matrix_inverse(m)
    end if

  end subroutine matrix_bcknd_inverse


  !> Invert a square matrix in place on the host using Gauss-Jordan
  !! elimination with full pivoting (Num. Rec. p. 30, 2nd Ed., Fortran).
  !! Only the host array `m%x` is read and written.
  !! @param m Square matrix; on return `m%x` holds the inverse.
  !! @note Reports an error through `neko_error` when the matrix is not
  !! square, when no usable pivot can be found (e.g. the remaining entries
  !! are NaN), or when a pivot is smaller than `eps` in magnitude.
  subroutine cpu_matrix_inverse(m)
    class(matrix_t), intent(inout) :: m
    ! Row and column of the pivot selected in each elimination step
    integer :: indr(m%nrows), indc(m%ncols)
    ! ipiv(j) is 1 once column j has been used as a pivot column
    integer :: ipiv(m%ncols)
    ! rmult is a work array of length nrows = ncols holding the multipliers
    real(kind=rp) :: rmult(m%nrows), amx, tmp, piv
    ! Pivots below this magnitude are treated as a singular matrix
    real(kind=rp), parameter :: eps = 1e-9_rp
    integer :: i, j, k, ir, jc

    if (.not. (m%ncols .eq. m%nrows)) then
       call neko_error("Fatal error: trying to invert a matrix that is not &
            &square")
    end if

    ipiv = 0

    do k = 1, m%nrows

       ! Pivot search: largest entry in magnitude among the rows and
       ! columns that have not been used as a pivot yet. ir and jc are
       ! reset so a failed search cannot reuse the previous step's pivot.
       amx = 0.0_rp
       ir = 0
       jc = 0
       do i = 1, m%nrows
          if (ipiv(i) .ne. 1) then
             do j = 1, m%nrows
                if (ipiv(j) .eq. 0) then
                   if (abs(m%x(i, j)) .ge. amx) then
                      amx = abs(m%x(i, j))
                      ir  = i
                      jc  = j
                   end if
                end if
             end do
          end if
       end do

       ! No candidate passed the comparison above (NaN entries compare
       ! false); fail loudly instead of continuing with a bogus pivot.
       if (ir .eq. 0 .or. jc .eq. 0) then
          call neko_error("matrix_inverse error: no valid pivot found")
       end if
       ipiv(jc) = ipiv(jc) + 1

       ! Swap rows so that the pivot ends up on the diagonal
       if (ir .ne. jc) then
          do j = 1, m%ncols
             tmp        = m%x(ir, j)
             m%x(ir, j) = m%x(jc, j)
             m%x(jc, j) = tmp
          end do
       end if
       indr(k) = ir
       indc(k) = jc

       if (abs(m%x(jc, jc)) .lt. eps) then
          call neko_error("matrix_inverse error: small Gauss Jordan Piv")
       end if

       ! Normalise the pivot row
       piv = 1.0_rp/m%x(jc, jc)
       m%x(jc, jc) = 1.0_rp
       do j = 1, m%ncols
          m%x(jc, j) = m%x(jc, j)*piv
       end do

       ! Move the pivot row to row 1 so the elimination below can run
       ! over rows 2..nrows without a branch
       do j = 1, m%ncols
          tmp        = m%x(jc, j)
          m%x(jc, j) = m%x(1 , j)
          m%x(1 , j) = tmp
       end do

       ! Save the multipliers of the pivot column and clear that column
       do i = 2, m%nrows
          rmult(i)   = m%x(i, jc)
          m%x(i, jc) = 0.0_rp
       end do

       ! Eliminate the pivot column from all other rows
       do j = 1, m%ncols
          do i = 2, m%nrows
             m%x(i, j) = m%x(i, j) - rmult(i)*m%x(1, j)
          end do
       end do

       ! Move the pivot row back to its original position
       do j = 1, m%ncols
          tmp        = m%x(jc, j)
          m%x(jc, j) = m%x(1 , j)
          m%x(1 , j) = tmp
       end do

    end do

    ! Unscramble matrix: undo the row swaps as column swaps, last first
    do j = m%nrows, 1, -1
       if (indr(j) .ne. indc(j)) then
          do i = 1, m%nrows
             tmp             = m%x(i, indr(j))
             m%x(i, indr(j)) = m%x(i, indc(j))
             m%x(i, indc(j)) = tmp
          end do
       end if
    end do

  end subroutine cpu_matrix_inverse


end module matrix

device::device_map
Map a Fortran array to a device (allocate and associate)
Definition device.F90:57

utils::neko_error
Definition utils.f90:42

device_math
Definition device_math.F90:33

device_math::device_cmult2
subroutine, public device_cmult2(a_d, b_d, c, n)
Multiplication by constant c: a = c * b.
Definition device_math.F90:182

device_math::device_cmult
subroutine, public device_cmult(a_d, c, n)
Multiplication by constant c: a = c * a.
Definition device_math.F90:166

device_math::device_sub3
subroutine, public device_sub3(a_d, b_d, c_d, n)
Vector subtraction: a = b - c.
Definition device_math.F90:445

device_math::device_add3
subroutine, public device_add3(a_d, b_d, c_d, n)
Vector addition: a = b + c.
Definition device_math.F90:324

device_math::device_cadd2
subroutine, public device_cadd2(a_d, b_d, c, n)
Add a scalar to vector: a = b + c.
Definition device_math.F90:214

device_math::device_copy
subroutine, public device_copy(a_d, b_d, n)
Copy a vector: a = b.
Definition device_math.F90:76

device_math::device_cfill
subroutine, public device_cfill(a_d, c, n)
Set all elements to a constant c: a = c.
Definition device_math.F90:231

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

device::device_free
subroutine, public device_free(x_d)
Deallocate memory on the device.
Definition device.F90:185

math
Definition math.f90:60

math::cmult2
subroutine, public cmult2(a, b, c, n)
Multiplication by constant c: a = c * b.
Definition math.f90:701

math::cadd2
subroutine, public cadd2(a, b, s, n)
Add a scalar to vector: a = b + s.
Definition math.f90:335

math::add3
subroutine, public add3(a, b, c, n)
Vector addition: a = b + c.
Definition math.f90:600

math::sub3
subroutine, public sub3(a, b, c, n)
Vector subtraction: a = b - c.
Definition math.f90:642

math::chsign
subroutine, public chsign(a, n)
Change sign of vector: a = -a.
Definition math.f90:440

math::copy
subroutine, public copy(a, b, n)
Copy a vector: a = b.
Definition math.f90:239

matrix
Defines a matrix.
Definition matrix.f90:34

matrix::matrix_free
subroutine matrix_free(m)
Deallocate a matrix.
Definition matrix.f90:118

matrix::matrix_sub_matrix
type(matrix_t) function matrix_sub_matrix(m, b)
Matrix-matrix subtraction: v = m - b.
Definition matrix.f90:248

matrix::matrix_assign_matrix
subroutine matrix_assign_matrix(m, w)
Assignment: m = w.
Definition matrix.f90:143

matrix::matrix_add_scalar_left
type(matrix_t) function matrix_add_scalar_left(m, c)
Matrix-scalar addition: v = m + c.
Definition matrix.f90:215

matrix::matrix_sub_scalar_right
type(matrix_t) function matrix_sub_scalar_right(c, m)
Scalar-matrix subtraction: v = c - m.
Definition matrix.f90:296

matrix::matrix_add_matrix
type(matrix_t) function matrix_add_matrix(m, b)
Matrix-matrix addition: v = m + b.
Definition matrix.f90:190

matrix::matrix_add_scalar_right
type(matrix_t) function matrix_add_scalar_right(c, m)
Scalar-matrix addition: v = c + m.
Definition matrix.f90:238

matrix::matrix_cmult_right
type(matrix_t) function matrix_cmult_right(c, m)
Scalar-matrix multiplication: v = c * m.
Definition matrix.f90:335

matrix::matrix_bcknd_inverse
subroutine matrix_bcknd_inverse(m)
Definition matrix.f90:344

matrix::matrix_size
integer function matrix_size(m)
Returns the number of entries in the matrix.
Definition matrix.f90:136

matrix::cpu_matrix_inverse
subroutine cpu_matrix_inverse(m)
Definition matrix.f90:353

matrix::matrix_cmult_left
type(matrix_t) function matrix_cmult_left(m, c)
Matrix-scalar multiplication: v = m * c.
Definition matrix.f90:312

matrix::matrix_sub_scalar_left
type(matrix_t) function matrix_sub_scalar_left(m, c)
Matrix-scalar subtraction: v = m - c.
Definition matrix.f90:273

matrix::matrix_assign_scalar
subroutine matrix_assign_scalar(m, s)
Assignment: m = s.
Definition matrix.f90:173

matrix::matrix_init
subroutine matrix_init(m, nrows, ncols)
Initialise a matrix of size nrows*ncols.
Definition matrix.f90:97

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

utils
Utilities.
Definition utils.f90:35

matrix::matrix_t
Definition matrix.f90:46