d5/d20/matrix__math_8f90_source.html

! Copyright (c) 2008-2020, UCHICAGO ARGONNE, LLC.

!

! The UChicago Argonne, LLC as Operator of Argonne National

! Laboratory holds copyright in the Software. The copyright holder

! reserves all rights except those expressly granted to licensees,

! and U.S. Government license rights.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

! 1. Redistributions of source code must retain the above copyright

! notice, this list of conditions and the disclaimer below.

!

! 2. Redistributions in binary form must reproduce the above copyright

! notice, this list of conditions and the disclaimer (as noted below)

! in the documentation and/or other materials provided with the

! distribution.

!

! 3. Neither the name of ANL nor the names of its contributors

! may be used to endorse or promote products derived from this software

! without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL

! UCHICAGO ARGONNE, LLC, THE U.S. DEPARTMENT OF

! ENERGY OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED

! TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

! DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

! THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

! (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

! OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

!

! Additional BSD Notice

! ---------------------

! 1. This notice is required to be provided under our contract with

! the U.S. Department of Energy (DOE). This work was produced at

! Argonne National Laboratory under Contract

! No. DE-AC02-06CH11357 with the DOE.

!

! 2. Neither the United States Government nor UCHICAGO ARGONNE,

! LLC nor any of their employees, makes any warranty,

! express or implied, or assumes any liability or responsibility for the

! accuracy, completeness, or usefulness of any information, apparatus,

! product, or process disclosed, or represents that its use would not

! infringe privately-owned rights.

!

! 3. Also, reference herein to any specific commercial products, process,

! or services by trade name, trademark, manufacturer or otherwise does

! not necessarily constitute or imply its endorsement, recommendation,

! or favoring by the United States Government or UCHICAGO ARGONNE LLC.

! The views and opinions of authors expressed

! herein do not necessarily state or reflect those of the United States

! Government or UCHICAGO ARGONNE, LLC, and shall

! not be used for advertising or product endorsement purposes.

!

module matrix_math

  use neko_config, only: neko_bcknd_device

  use num_types, only: rp

  use matrix, only: matrix_t

  use device

  use math, only: rzero, rone, copy, cmult, cadd, cfill, invcol1, vdot3, add2, &

       add3, add4, sub2, sub3, add2s1, add2s2, addsqr2s2, cmult2, invcol2, &

       col2, col3, subcol3, add3s2, addcol3, addcol4, glsum, glsc2, glsc3, &

       masked_gather_copy_0, masked_scatter_copy_0, glsubnorm, invcol3

  use device_math, only: device_rzero, device_rone, device_copy, device_cmult, &

       device_cadd, device_cfill, device_invcol1, device_vdot3, device_add2, &

       device_add3, device_add4, device_sub2, device_sub3, device_add2s1, &

       device_add2s2, device_addsqr2s2, device_cmult2, device_invcol2, &

       device_col2, device_col3, device_subcol3, device_add3s2, &

       device_addcol3, device_addcol4, device_glsum, device_glsc2, &

       device_glsc3, device_masked_gather_copy_0, device_masked_scatter_copy_0,&

       device_glsubnorm, device_invcol3

  use, intrinsic :: iso_c_binding, only: c_ptr

  implicit none

  private


  ! Public interface of the module. Every wrapper defined below is exported.
  ! matrix_add4 is listed next to matrix_add2/matrix_add3: the module default
  ! is `private`, so leaving it out made the routine unreachable by callers.
  public :: matrix_rzero, matrix_rone, matrix_copy, matrix_cmult, &
       matrix_cadd, matrix_cfill, matrix_invcol1, matrix_invcol3, &
       matrix_add2, matrix_add3, matrix_add4, matrix_sub2, matrix_sub3, &
       matrix_add2s1, matrix_add2s2, matrix_addsqr2s2, matrix_cmult2, &
       matrix_invcol2, matrix_col2, matrix_col3, matrix_subcol3, &
       matrix_add3s2, matrix_addcol3, matrix_addcol4, matrix_glsum, &
       matrix_glsc2, matrix_glsc3, matrix_glsubnorm


contains


  !> Zero a real matrix.
  !! @param a Matrix to be zeroed.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_rzero(a, n)
    type(matrix_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call rzero(a%x, n_elem)
    else
       call device_rzero(a%x_d, n_elem)
    end if

  end subroutine matrix_rzero


  !> Set all elements of a matrix to one.
  !! @param a Matrix to be filled with ones.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_rone(a, n)
    type(matrix_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call rone(a%x, n_elem)
    else
       call device_rone(a%x_d, n_elem)
    end if

  end subroutine matrix_rone


  !> Copy a matrix: `a` is the destination, `b` the source.
  !! @param a Matrix that receives the data.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_copy(a, b, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the destination decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call copy(a%x, b%x, n_elem)
    else
       call device_copy(a%x_d, b%x_d, n_elem)
    end if

  end subroutine matrix_copy


  !> Multiplication of a matrix by the constant `c`, in place.
  !! @param a Matrix that is scaled.
  !! @param c Scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_cmult(a, c, n)
    type(matrix_t), intent(inout) :: a
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call cmult(a%x, c, n_elem)
    else
       call device_cmult(a%x_d, c, n_elem)
    end if

  end subroutine matrix_cmult


  !> Add the scalar `s` to a matrix, in place.
  !! @param a Matrix that is updated.
  !! @param s Scalar to add.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_cadd(a, s, n)
    type(matrix_t), intent(inout) :: a
    real(kind=rp), intent(in) :: s
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call cadd(a%x, s, n_elem)
    else
       call device_cadd(a%x_d, s, n_elem)
    end if

  end subroutine matrix_cadd


  !> Set all elements of a matrix to the constant `c`.
  !! @param a Matrix to be filled.
  !! @param c Fill value.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_cfill(a, c, n)
    type(matrix_t), intent(inout) :: a
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call cfill(a%x, c, n_elem)
    else
       call device_cfill(a%x_d, c, n_elem)
    end if

  end subroutine matrix_cfill


  !> Invert the elements of a matrix, in place.
  !! NOTE(review): presumably \f$ a = 1 / a \f$ element-wise; confirm against
  !! math::invcol1.
  !! @param a Matrix whose elements are inverted.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_invcol1(a, n)
    type(matrix_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, operate on the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call invcol1(a%x, n_elem)
    else
       call device_invcol1(a%x_d, n_elem)
    end if

  end subroutine matrix_invcol1


  !> Element division of two matrices, stored in `a`.
  !! NOTE(review): presumably \f$ a = b / c \f$; confirm against
  !! math::invcol3.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_invcol3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call invcol3(a%x, b%x, c%x, n_elem)
    else
       call device_invcol3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_invcol3


  !> Vector addition of two matrices, accumulated into `a`.
  !! NOTE(review): presumably \f$ a = a + b \f$; confirm against math::add2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add2(a, b, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add2(a%x, b%x, n_elem)
    else
       call device_add2(a%x_d, b%x_d, n_elem)
    end if

  end subroutine matrix_add2


  !> Vector addition of two matrices, stored in a third.
  !! NOTE(review): presumably \f$ a = b + c \f$; confirm against math::add3.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add3(a%x, b%x, c%x, n_elem)
    else
       call device_add3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_add3


  !> Vector addition of three matrices, stored in a fourth.
  !! NOTE(review): presumably \f$ a = b + c + d \f$; confirm against
  !! math::add4.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param d Third input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add4(a, b, c, d, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c, d
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add4(a%x, b%x, c%x, d%x, n_elem)
    else
       call device_add4(a%x_d, b%x_d, c%x_d, d%x_d, n_elem)
    end if

  end subroutine matrix_add4


  !> Vector subtraction of two matrices, applied to `a` in place.
  !! NOTE(review): presumably \f$ a = a - b \f$; confirm against math::sub2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_sub2(a, b, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call sub2(a%x, b%x, n_elem)
    else
       call device_sub2(a%x_d, b%x_d, n_elem)
    end if

  end subroutine matrix_sub2


  !> Vector subtraction of two matrices, stored in a third.
  !! NOTE(review): presumably \f$ a = b - c \f$; confirm against math::sub3.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_sub3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call sub3(a%x, b%x, c%x, n_elem)
    else
       call device_sub3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_sub3


  !> Vector addition with scalar multiplication (multiplication on first
  !! argument), accumulated into `a`.
  !! NOTE(review): presumably \f$ a = c_1 a + b \f$; confirm against
  !! math::add2s1.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param c1 Scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add2s1(a, b, c1, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add2s1(a%x, b%x, c1, n_elem)
    else
       call device_add2s1(a%x_d, b%x_d, c1, n_elem)
    end if

  end subroutine matrix_add2s1


  !> Vector addition with scalar multiplication (multiplication on second
  !! argument), accumulated into `a`.
  !! NOTE(review): presumably \f$ a = a + c_1 b \f$; confirm against
  !! math::add2s2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param c1 Scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add2s2(a, b, c1, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add2s2(a%x, b%x, c1, n_elem)
    else
       call device_add2s2(a%x_d, b%x_d, c1, n_elem)
    end if

  end subroutine matrix_add2s2


  !> Forward to addsqr2s2 / device_addsqr2s2, updating `a` from `b` and `c1`.
  !! NOTE(review): presumably \f$ a = a + c_1 (b \cdot b) \f$; confirm
  !! against math::addsqr2s2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param c1 Scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_addsqr2s2(a, b, c1, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call addsqr2s2(a%x, b%x, c1, n_elem)
    else
       call device_addsqr2s2(a%x_d, b%x_d, c1, n_elem)
    end if

  end subroutine matrix_addsqr2s2


  !> Multiplication of matrix `b` by the constant `c`, stored in `a`.
  !! NOTE(review): presumably \f$ a = c \cdot b \f$; confirm against
  !! math::cmult2.
  !! @param a Matrix that receives the result.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param c Scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_cmult2(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call cmult2(a%x, b%x, c, n_elem)
    else
       call device_cmult2(a%x_d, b%x_d, c, n_elem)
    end if

  end subroutine matrix_cmult2


  !> Vector division of two matrices, applied to `a` in place.
  !! NOTE(review): presumably \f$ a = a / b \f$; confirm against
  !! math::invcol2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_invcol2(a, b, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call invcol2(a%x, b%x, n_elem)
    else
       call device_invcol2(a%x_d, b%x_d, n_elem)
    end if

  end subroutine matrix_invcol2


  !> Vector multiplication of two matrices, applied to `a` in place.
  !! NOTE(review): presumably \f$ a = a \cdot b \f$ element-wise; confirm
  !! against math::col2.
  !! @param a Matrix that is updated.
  !! @param b Matrix that is read; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_col2(a, b, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call col2(a%x, b%x, n_elem)
    else
       call device_col2(a%x_d, b%x_d, n_elem)
    end if

  end subroutine matrix_col2


  !> Vector multiplication with 3 matrices: `b` and `c` are read, `a` is
  !! written.
  !! NOTE(review): presumably \f$ a = b \cdot c \f$ element-wise; confirm
  !! against math::col3.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_col3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call col3(a%x, b%x, c%x, n_elem)
    else
       call device_col3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_col3


  !> Forward to subcol3 / device_subcol3, updating `a` from `b` and `c`.
  !! NOTE(review): presumably \f$ a = a - b \cdot c \f$; confirm against
  !! math::subcol3.
  !! @param a Matrix that is updated.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_subcol3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call subcol3(a%x, b%x, c%x, n_elem)
    else
       call device_subcol3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_subcol3


  !> Forward to add3s2 / device_add3s2, writing `a` from `b`, `c` and the
  !! scalars `c1`, `c2`.
  !! NOTE(review): presumably \f$ a = c_1 b + c_2 c \f$; confirm against
  !! math::add3s2.
  !! @param a Matrix that receives the result.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param c1 First scalar factor.
  !! @param c2 Second scalar factor.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_add3s2(a, b, c, c1, c2, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    real(kind=rp), intent(in) :: c1, c2
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call add3s2(a%x, b%x, c%x, c1, c2, n_elem)
    else
       call device_add3s2(a%x_d, b%x_d, c%x_d, c1, c2, n_elem)
    end if

  end subroutine matrix_add3s2


  !> Forward to addcol3 / device_addcol3, updating `a` from `b` and `c`.
  !! NOTE(review): presumably \f$ a = a + b \cdot c \f$; confirm against
  !! math::addcol3.
  !! @param a Matrix that is updated.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_addcol3(a, b, c, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call addcol3(a%x, b%x, c%x, n_elem)
    else
       call device_addcol3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end subroutine matrix_addcol3


  !> Forward to addcol4 / device_addcol4, updating `a` from `b`, `c` and `d`.
  !! NOTE(review): presumably \f$ a = a + b \cdot c \cdot d \f$; confirm
  !! against math::addcol4.
  !! @param a Matrix that is updated.
  !! @param b First input matrix (read only).
  !! @param c Second input matrix (read only).
  !! @param d Third input matrix (read only).
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  subroutine matrix_addcol4(a, b, c, d, n)
    type(matrix_t), intent(inout) :: a
    type(matrix_t), intent(in) :: b, c, d
    integer, intent(in), optional :: n
    integer :: n_elem

    ! Without an explicit count, the size of the result matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       call addcol4(a%x, b%x, c%x, d%x, n_elem)
    else
       call device_addcol4(a%x_d, b%x_d, c%x_d, d%x_d, n_elem)
    end if

  end subroutine matrix_addcol4


  !> Global sum of all elements in a matrix.
  !! @param a Matrix whose elements are summed.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  !! @return The value returned by glsum / device_glsum.
  function matrix_glsum(a, n) result(sum)
    type(matrix_t), intent(in) :: a
    integer, intent(in), optional :: n
    real(kind=rp) :: sum
    integer :: n_elem

    ! Without an explicit count, sum over the whole matrix.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointer is used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       sum = glsum(a%x, n_elem)
    else
       sum = device_glsum(a%x_d, n_elem)
    end if

  end function matrix_glsum


  !> Global inner product of two matrices.
  !! @param a First matrix; its size is the default entry count.
  !! @param b Second matrix; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  !! @return The value returned by glsc2 / device_glsc2.
  function matrix_glsc2(a, b, n) result(ip)
    type(matrix_t), intent(in) :: a, b
    integer, intent(in), optional :: n
    real(kind=rp) :: ip
    integer :: n_elem

    ! Without an explicit count, the size of the first matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       ip = glsc2(a%x, b%x, n_elem)
    else
       ip = device_glsc2(a%x_d, b%x_d, n_elem)
    end if

  end function matrix_glsc2


  !> Global inner product of three matrices.
  !! @param a First matrix; its size is the default entry count.
  !! @param b Second matrix; its size is not checked here.
  !! @param c Third matrix; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  !! @return The value returned by glsc3 / device_glsc3.
  function matrix_glsc3(a, b, c, n) result(ip)
    type(matrix_t), intent(in) :: a, b, c
    integer, intent(in), optional :: n
    real(kind=rp) :: ip
    integer :: n_elem

    ! Without an explicit count, the size of the first matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       ip = glsc3(a%x, b%x, c%x, n_elem)
    else
       ip = device_glsc3(a%x_d, b%x_d, c%x_d, n_elem)
    end if

  end function matrix_glsc3


  !> Global subtracted norm of two matrices, i.e. the norm of their
  !! difference as computed by glsubnorm / device_glsubnorm.
  !! @param a First matrix; its size is the default entry count.
  !! @param b Second matrix; its size is not checked here.
  !! @param n Optional entry count forwarded to the backend routine;
  !! defaults to `a%size()`.
  !! @return The value returned by glsubnorm / device_glsubnorm.
  function matrix_glsubnorm(a, b, n) result(norm)
    type(matrix_t), intent(in) :: a, b
    integer, intent(in), optional :: n
    real(kind=rp) :: norm
    integer :: n_elem

    ! Without an explicit count, the size of the first matrix decides.
    if (.not. present(n)) then
       n_elem = a%size()
    else
       n_elem = n
    end if

    ! The device pointers are used only when the device backend is selected.
    if (neko_bcknd_device /= 1) then
       norm = glsubnorm(a%x, b%x, n_elem)
    else
       norm = device_glsubnorm(a%x_d, b%x_d, n_elem)
    end if

  end function matrix_glsubnorm


end module matrix_math

device_math::device_cadd
Definition device_math.F90:50

device_math
Definition device_math.F90:33

device_math::device_add2s1
subroutine, public device_add2s1(a_d, b_d, c1, n, strm)
Definition device_math.F90:517

device_math::device_sub3
subroutine, public device_sub3(a_d, b_d, c_d, n, strm)
Vector subtraction .
Definition device_math.F90:886

device_math::device_masked_scatter_copy_0
subroutine, public device_masked_scatter_copy_0(a_d, b_d, mask_d, n, n_mask, strm)
Scatter a masked vector .
Definition device_math.F90:151

device_math::device_add2s2
subroutine, public device_add2s2(a_d, b_d, c1, n, strm)
Vector addition with scalar multiplication (multiplication on second argument)
Definition device_math.F90:545

device_math::device_add2
subroutine, public device_add2(a_d, b_d, n, strm)
Vector addition .
Definition device_math.F90:467

device_math::device_addcol3
subroutine, public device_addcol3(a_d, b_d, c_d, n, strm)
Returns .
Definition device_math.F90:912

device_math::device_glsum
real(kind=rp) function, public device_glsum(a_d, n, strm)
Sum a vector of length n.
Definition device_math.F90:1242

device_math::device_invcol1
subroutine, public device_invcol1(a_d, n, strm)
Invert a vector .
Definition device_math.F90:706

device_math::device_add3s2
subroutine, public device_add3s2(a_d, b_d, c_d, c1, c2, n, strm)
Returns .
Definition device_math.F90:625

device_math::device_rzero
subroutine, public device_rzero(a_d, n, strm)
Zero a real vector.
Definition device_math.F90:232

device_math::device_rone
subroutine, public device_rone(a_d, n, strm)
Set all elements to one.
Definition device_math.F90:258

device_math::device_cmult
subroutine, public device_cmult(a_d, c, n, strm)
Multiplication by constant c .
Definition device_math.F90:281

device_math::device_vdot3
subroutine, public device_vdot3(dot_d, u1_d, u2_d, u3_d, v1_d, v2_d, v3_d, n, strm)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition device_math.F90:992

device_math::device_glsubnorm
real(kind=rp) function, public device_glsubnorm(a_d, b_d, n, strm)
Returns the norm of the difference of two vectors .
Definition device_math.F90:1206

device_math::device_sub2
subroutine, public device_sub2(a_d, b_d, n, strm)
Vector subtraction \f$ a = a - b \f$.
Definition device_math.F90:860

device_math::device_copy
subroutine, public device_copy(a_d, b_d, n, strm)
Copy a vector .
Definition device_math.F90:73

device_math::device_invcol3
subroutine, public device_invcol3(a_d, b_d, c_d, n, strm)
Vector division .
Definition device_math.F90:758

device_math::device_col2
subroutine, public device_col2(a_d, b_d, n, strm)
Vector multiplication .
Definition device_math.F90:783

device_math::device_add4
subroutine, public device_add4(a_d, b_d, c_d, d_d, n, strm)
Definition device_math.F90:492

device_math::device_subcol3
subroutine, public device_subcol3(a_d, b_d, c_d, n, strm)
Returns .
Definition device_math.F90:834

device_math::device_masked_gather_copy_0
subroutine, public device_masked_gather_copy_0(a_d, b_d, mask_d, n, n_mask, strm)
Gather a masked vector .
Definition device_math.F90:125

device_math::device_invcol2
subroutine, public device_invcol2(a_d, b_d, n, strm)
Vector division .
Definition device_math.F90:732

device_math::device_addsqr2s2
subroutine, public device_addsqr2s2(a_d, b_d, c1, n, strm)
Returns .
Definition device_math.F90:572

device_math::device_glsc3
real(kind=rp) function, public device_glsc3(a_d, b_d, c_d, n, strm)
Weighted inner product .
Definition device_math.F90:1082

device_math::device_glsc2
real(kind=rp) function, public device_glsc2(a_d, b_d, n, strm)
Weighted inner product .
Definition device_math.F90:1172

device_math::device_cmult2
subroutine, public device_cmult2(a_d, b_d, c, n, strm)
Multiplication by constant c .
Definition device_math.F90:308

device_math::device_col3
subroutine, public device_col3(a_d, b_d, c_d, n, strm)
Vector multiplication with 3 vectors .
Definition device_math.F90:808

device_math::device_addcol4
subroutine, public device_addcol4(a_d, b_d, c_d, d_d, n, strm)
Returns .
Definition device_math.F90:938

device_math::device_cfill
subroutine, public device_cfill(a_d, c, n, strm)
Set all elements to a constant c .
Definition device_math.F90:440

device_math::device_add3
subroutine, public device_add3(a_d, b_d, c_d, n, strm)
Vector addition .
Definition device_math.F90:599

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

math
Definition math.f90:60

math::cmult
subroutine, public cmult(a, c, n)
Multiplication by constant c .
Definition math.f90:411

math::cmult2
subroutine, public cmult2(a, b, c, n)
Multiplication by constant c .
Definition math.f90:423

math::invcol2
subroutine, public invcol2(a, b, n)
Vector division .
Definition math.f90:840

math::glsc3
real(kind=rp) function, public glsc3(a, b, c, n)
Weighted inner product .
Definition math.f90:1067

math::cadd
subroutine, public cadd(a, s, n)
Add a scalar to vector .
Definition math.f90:462

math::addsqr2s2
subroutine, public addsqr2s2(a, b, c1, n)
Returns .
Definition math.f90:826

math::add2s1
subroutine, public add2s1(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition math.f90:797

math::glsc2
real(kind=rp) function, public glsc2(a, b, n)
Weighted inner product .
Definition math.f90:1048

math::masked_scatter_copy_0
subroutine, public masked_scatter_copy_0(a, b, mask, n, n_mask)
Scatter a contiguous vector to masked positions in a target array.
Definition math.f90:358

math::subcol3
subroutine, public subcol3(a, b, c, n)
Returns .
Definition math.f90:881

math::rone
subroutine, public rone(a, n)
Set all elements to one.
Definition math.f90:238

math::add3
subroutine, public add3(a, b, c, n)
Vector addition .
Definition math.f90:739

math::glsum
real(kind=rp) function, public glsum(a, n)
Sum a vector of length n.
Definition math.f90:499

math::sub3
subroutine, public sub3(a, b, c, n)
Vector subtraction .
Definition math.f90:781

math::addcol4
subroutine, public addcol4(a, b, c, d, n)
Returns .
Definition math.f90:972

math::add2
subroutine, public add2(a, b, n)
Vector addition .
Definition math.f90:726

math::cfill
subroutine, public cfill(a, c, n)
Set all elements to a constant c .
Definition math.f90:487

math::invcol3
subroutine, public invcol3(a, b, c, n)
Invert a vector .
Definition math.f90:626

math::add3s2
subroutine, public add3s2(a, b, c, c1, c2, n)
Returns .
Definition math.f90:895

math::masked_gather_copy_0
subroutine, public masked_gather_copy_0(a, b, mask, n, n_mask)
Gather a masked vector to a reduced contiguous vector.
Definition math.f90:312

math::addcol3
subroutine, public addcol3(a, b, c, n)
Returns .
Definition math.f90:958

math::invcol1
subroutine, public invcol1(a, n)
Invert a vector .
Definition math.f90:614

math::col2
subroutine, public col2(a, b, n)
Vector multiplication .
Definition math.f90:854

math::copy
subroutine, public copy(a, b, n)
Copy a vector .
Definition math.f90:249

math::add4
subroutine, public add4(a, b, c, d, n)
Vector addition .
Definition math.f90:753

math::col3
subroutine, public col3(a, b, c, n)
Vector multiplication with 3 vectors .
Definition math.f90:867

math::vdot3
subroutine, public vdot3(dot, u1, u2, u3, v1, v2, v3, n)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition math.f90:684

math::rzero
subroutine, public rzero(a, n)
Zero a real vector.
Definition math.f90:205

math::glsubnorm
real(kind=rp) function, public glsubnorm(a, b, n)
Returns the norm of the difference of two vectors .
Definition math.f90:1109

math::sub2
subroutine, public sub2(a, b, n)
Vector subtraction \f$ a = a - b \f$.
Definition math.f90:768

math::add2s2
subroutine, public add2s2(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on second argument)
Definition math.f90:812

matrix_math
Definition matrix_math.f90:60

matrix_math::matrix_glsum
real(kind=rp) function, public matrix_glsum(a, n)
Global sum of all elements in a matrix .
Definition matrix_math.f90:606

matrix_math::matrix_copy
subroutine, public matrix_copy(a, b, n)
Copy a matrix .
Definition matrix_math.f90:132

matrix_math::matrix_invcol2
subroutine, public matrix_invcol2(a, b, n)
Vector division .
Definition matrix_math.f90:451

matrix_math::matrix_add2
subroutine, public matrix_add2(a, b, n)
Vector addition .
Definition matrix_math.f90:254

matrix_math::matrix_addcol4
subroutine, public matrix_addcol4(a, b, c, d, n)
Returns .
Definition matrix_math.f90:583

matrix_math::matrix_cadd
subroutine, public matrix_cadd(a, s, n)
Add a scalar to matrix .
Definition matrix_math.f90:172

matrix_math::matrix_cmult
subroutine, public matrix_cmult(a, c, n)
Multiplication by constant c .
Definition matrix_math.f90:152

matrix_math::matrix_add3s2
subroutine, public matrix_add3s2(a, b, c, c1, c2, n)
Returns .
Definition matrix_math.f90:538

matrix_math::matrix_cmult2
subroutine, public matrix_cmult2(a, b, c, n)
Multiplication by constant c .
Definition matrix_math.f90:429

matrix_math::matrix_add4
subroutine matrix_add4(a, b, c, d, n)
Vector addition .
Definition matrix_math.f90:296

matrix_math::matrix_col3
subroutine, public matrix_col3(a, b, c, n)
Vector multiplication with 3 vectors .
Definition matrix_math.f90:494

matrix_math::matrix_cfill
subroutine, public matrix_cfill(a, c, n)
Set all elements to a constant c .
Definition matrix_math.f90:192

matrix_math::matrix_invcol1
subroutine, public matrix_invcol1(a, n)
Invert elements of a matrix .
Definition matrix_math.f90:212

matrix_math::matrix_glsc3
real(kind=rp) function, public matrix_glsc3(a, b, c, n)
Global inner product of three matrices .
Definition matrix_math.f90:648

matrix_math::matrix_sub2
subroutine, public matrix_sub2(a, b, n)
Vector subtraction \f$ a = a - b \f$.
Definition matrix_math.f90:317

matrix_math::matrix_subcol3
subroutine, public matrix_subcol3(a, b, c, n)
Returns .
Definition matrix_math.f90:516

matrix_math::matrix_addsqr2s2
subroutine, public matrix_addsqr2s2(a, b, c1, n)
Returns .
Definition matrix_math.f90:407

matrix_math::matrix_add3
subroutine, public matrix_add3(a, b, c, n)
Vector addition .
Definition matrix_math.f90:275

matrix_math::matrix_rzero
subroutine, public matrix_rzero(a, n)
Zero a real matrix .
Definition matrix_math.f90:94

matrix_math::matrix_glsc2
real(kind=rp) function, public matrix_glsc2(a, b, n)
Global inner product of two matrices .
Definition matrix_math.f90:627

matrix_math::matrix_add2s2
subroutine, public matrix_add2s2(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on second argument)
Definition matrix_math.f90:385

matrix_math::matrix_addcol3
subroutine, public matrix_addcol3(a, b, c, n)
Returns .
Definition matrix_math.f90:561

matrix_math::matrix_add2s1
subroutine, public matrix_add2s1(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition matrix_math.f90:362

matrix_math::matrix_invcol3
subroutine, public matrix_invcol3(a, b, c, n)
Element division of two matrices .
Definition matrix_math.f90:232

matrix_math::matrix_glsubnorm
real(kind=rp) function, public matrix_glsubnorm(a, b, n)
Global subtracted norm of two matrices .
Definition matrix_math.f90:670

matrix_math::matrix_col2
subroutine, public matrix_col2(a, b, n)
Vector multiplication .
Definition matrix_math.f90:473

matrix_math::matrix_rone
subroutine, public matrix_rone(a, n)
Set all elements to one.
Definition matrix_math.f90:113

matrix_math::matrix_sub3
subroutine, public matrix_sub3(a, b, c, n)
Vector subtraction .
Definition matrix_math.f90:338

matrix
Defines a matrix.
Definition matrix.f90:34

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

matrix::matrix_t
Definition matrix.f90:47