d6/d03/vector__math_8f90_source.html

! Copyright (c) 2008-2020, UCHICAGO ARGONNE, LLC.

!

! The UChicago Argonne, LLC as Operator of Argonne National

! Laboratory holds copyright in the Software. The copyright holder

! reserves all rights except those expressly granted to licensees,

! and U.S. Government license rights.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

! 1. Redistributions of source code must retain the above copyright

! notice, this list of conditions and the disclaimer below.

!

! 2. Redistributions in binary form must reproduce the above copyright

! notice, this list of conditions and the disclaimer (as noted below)

! in the documentation and/or other materials provided with the

! distribution.

!

! 3. Neither the name of ANL nor the names of its contributors

! may be used to endorse or promote products derived from this software

! without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL

! UCHICAGO ARGONNE, LLC, THE U.S. DEPARTMENT OF

! ENERGY OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED

! TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

! DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

! THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

! (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

! OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

!

! Additional BSD Notice

! ---------------------

! 1. This notice is required to be provided under our contract with

! the U.S. Department of Energy (DOE). This work was produced at

! Argonne National Laboratory under Contract

! No. DE-AC02-06CH11357 with the DOE.

!

! 2. Neither the United States Government nor UCHICAGO ARGONNE,

! LLC nor any of their employees, makes any warranty,

! express or implied, or assumes any liability or responsibility for the

! accuracy, completeness, or usefulness of any information, apparatus,

! product, or process disclosed, or represents that its use would not

! infringe privately-owned rights.

!

! 3. Also, reference herein to any specific commercial products, process,

! or services by trade name, trademark, manufacturer or otherwise does

! not necessarily constitute or imply its endorsement, recommendation,

! or favoring by the United States Government or UCHICAGO ARGONNE LLC.

! The views and opinions of authors expressed

! herein do not necessarily state or reflect those of the United States

! Government or UCHICAGO ARGONNE, LLC, and shall

! not be used for advertising or product endorsement purposes.

!

module vector_math

  use neko_config, only: neko_bcknd_device

  use num_types, only: rp

  use vector, only: vector_t

  use device

  use math, only: rzero, rone, copy, cmult, cadd, cfill, invcol1, vdot3, add2, &

       add3, add4, sub2, sub3, add2s1, add2s2, addsqr2s2, cmult2, invcol2, &

       col2, col3, subcol3, add3s2, addcol3, addcol4, glsum, glsc2, glsc3, &

       masked_gather_copy_0, masked_scatter_copy_0, glsubnorm, invcol3

  use device_math, only: device_rzero, device_rone, device_copy, device_cmult, &

       device_cadd, device_cfill, device_invcol1, device_vdot3, device_add2, &

       device_add3, device_add4, device_sub2, device_sub3, device_add2s1, &

       device_add2s2, device_addsqr2s2, device_cmult2, device_invcol2, &

       device_col2, device_col3, device_subcol3, device_add3s2, &

       device_addcol3, device_addcol4, device_glsum, device_glsc2, &

       device_glsc3, device_masked_gather_copy_0, device_masked_scatter_copy_0,&

       device_glsubnorm, device_invcol3

  use, intrinsic :: iso_c_binding, only: c_ptr

  implicit none

  private


  ! Public interface of the module. vector_add4 is listed together with the
  ! other wrappers so that the procedure defined in this module can be
  ! reached from outside of it.
  public :: vector_rzero, vector_rone, vector_copy, vector_cmult, &
       vector_cadd, vector_cfill, vector_invcol1, vector_invcol3, vector_vdot3, &
       vector_add2, vector_add3, vector_add4, vector_sub2, vector_sub3, &
       vector_add2s1, vector_add2s2, vector_addsqr2s2, vector_cmult2, &
       vector_invcol2, vector_col2, vector_col3, vector_subcol3, &
       vector_add3s2, vector_addcol3, vector_addcol4, vector_glsum, &
       vector_glsc2, vector_glsc3, vector_glsubnorm, &
       vector_masked_gather_copy_0, vector_masked_scatter_copy_0


contains


  !> Zero a real vector.
  !! Calls device_rzero on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! rzero on `a%x`.
  !! @param a Vector to zero.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_rzero(a, n)
    type(vector_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_rzero(a%x_d, n_entries)
    else
       call rzero(a%x, n_entries)
    end if

  end subroutine vector_rzero


  !> Set all elements to one.
  !! Calls device_rone on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! rone on `a%x`.
  !! @param a Vector to fill.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_rone(a, n)
    type(vector_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_rone(a%x_d, n_entries)
    else
       call rone(a%x, n_entries)
    end if

  end subroutine vector_rone


  !> Copy a vector.
  !! Calls device_copy on the device pointers when neko_bcknd_device is 1,
  !! otherwise copy on the host arrays.
  !! @param a Destination vector.
  !! @param b Source vector (read-only).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_copy(a, b, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_entries

    ! The default length is taken from the destination, not from `b`.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_copy(a%x_d, b%x_d, n_entries)
    else
       call copy(a%x, b%x, n_entries)
    end if

  end subroutine vector_copy


  !> Multiplication by constant c.
  !! Calls device_cmult on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! cmult on `a%x`.
  !! @param a Vector updated in place.
  !! @param c Scalar constant forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_cmult(a, c, n)
    type(vector_t), intent(inout) :: a
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_cmult(a%x_d, c, n_entries)
    else
       call cmult(a%x, c, n_entries)
    end if

  end subroutine vector_cmult


  !> Add a scalar to vector.
  !! Calls device_cadd on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! cadd on `a%x`.
  !! @param a Vector updated in place.
  !! @param s Scalar forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_cadd(a, s, n)
    type(vector_t), intent(inout) :: a
    real(kind=rp), intent(in) :: s
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_cadd(a%x_d, s, n_entries)
    else
       call cadd(a%x, s, n_entries)
    end if

  end subroutine vector_cadd


  !> Set all elements to a constant c.
  !! Calls device_cfill on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! cfill on `a%x`.
  !! @param a Vector to fill.
  !! @param c Constant forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_cfill(a, c, n)
    type(vector_t), intent(inout) :: a
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_cfill(a%x_d, c, n_entries)
    else
       call cfill(a%x, c, n_entries)
    end if

  end subroutine vector_cfill


  !> Invert a vector.
  !! Calls device_invcol1 on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! invcol1 on `a%x`.
  !! @param a Vector updated in place.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_invcol1(a, n)
    type(vector_t), intent(inout) :: a
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_invcol1(a%x_d, n_entries)
    else
       call invcol1(a%x, n_entries)
    end if

  end subroutine vector_invcol1


  !> Vector division involving three vectors.
  !! Calls device_invcol3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise invcol3 on the host arrays.
  !! NOTE(review): presumably a = b / c entry by entry; the formula is not
  !! visible in this file, confirm against math::invcol3.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_invcol3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_invcol3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call invcol3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_invcol3


  !> Compute a dot product (3-d version) from the component vectors
  !! (u1, u2, u3) and (v1, v2, v3), storing the result in `dot`.
  !! Calls device_vdot3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise vdot3 on the host arrays.
  !! @param dot Vector receiving the result. It is `intent(inout)` because
  !! this routine reads `dot%size()` and the existing `dot%x` / `dot%x_d`
  !! storage on entry; with `intent(out)` the dummy would be undefined (and
  !! any allocatable components deallocated) before those reads.
  !! @param u1 First component of the first operand (read-only).
  !! @param u2 Second component of the first operand (read-only).
  !! @param u3 Third component of the first operand (read-only).
  !! @param v1 First component of the second operand (read-only).
  !! @param v2 Second component of the second operand (read-only).
  !! @param v3 Third component of the second operand (read-only).
  !! @param n Optional number of entries to process; `dot%size()` is used
  !! when it is absent.
  subroutine vector_vdot3(dot, u1, u2, u3, v1, v2, v3, n)
    integer, intent(in), optional :: n
    type(vector_t), intent(in) :: u1, u2, u3
    type(vector_t), intent(in) :: v1, v2, v3
    type(vector_t), intent(inout) :: dot
    integer :: n_entries

    ! The default length comes from the result vector.
    if (present(n)) then
       n_entries = n
    else
       n_entries = dot%size()
    end if

    if (neko_bcknd_device .eq. 1) then
       call device_vdot3(dot%x_d, &
            u1%x_d, u2%x_d, u3%x_d, &
            v1%x_d, v2%x_d, v3%x_d, &
            n_entries)
    else
       call vdot3(dot%x, &
            u1%x, u2%x, u3%x, &
            v1%x, v2%x, v3%x, &
            n_entries)
    end if

  end subroutine vector_vdot3


  !> Vector addition.
  !! Calls device_add2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add2 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add2(a, b, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add2(a%x_d, b%x_d, n_entries)
    else
       call add2(a%x, b%x, n_entries)
    end if

  end subroutine vector_add2


  !> Vector addition with two read-only operands.
  !! Calls device_add3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add3 on the host arrays.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call add3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_add3


  !> Vector addition with three read-only operands.
  !! Calls device_add4 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add4 on the host arrays.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param d Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add4(a, b, c, d, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c, d
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add4(a%x_d, b%x_d, c%x_d, d%x_d, n_entries)
    else
       call add4(a%x, b%x, c%x, d%x, n_entries)
    end if

  end subroutine vector_add4


  !> Vector subtraction.
  !! Calls device_sub2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise sub2 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Second operand.
  !! NOTE(review): `b` is declared intent(inout) although this wrapper only
  !! forwards it; presumably this mirrors the interface of math::sub2 --
  !! confirm before tightening it to intent(in).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_sub2(a, b, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(inout) :: b
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_sub2(a%x_d, b%x_d, n_entries)
    else
       call sub2(a%x, b%x, n_entries)
    end if

  end subroutine vector_sub2


  !> Vector subtraction with two read-only operands.
  !! Calls device_sub3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise sub3 on the host arrays.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_sub3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_sub3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call sub3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_sub3


  !> Vector addition with scalar multiplication
  !! (multiplication on first argument).
  !! Calls device_add2s1 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add2s1 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Second operand.
  !! NOTE(review): `b` is declared intent(inout) although this wrapper only
  !! forwards it; presumably this mirrors the interface of math::add2s1 --
  !! confirm before tightening it to intent(in).
  !! @param c1 Scalar factor forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add2s1(a, b, c1, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(inout) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add2s1(a%x_d, b%x_d, c1, n_entries)
    else
       call add2s1(a%x, b%x, c1, n_entries)
    end if

  end subroutine vector_add2s1


  !> Vector addition with scalar multiplication
  !! (multiplication on second argument).
  !! Calls device_add2s2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add2s2 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Second operand.
  !! NOTE(review): `b` is declared intent(inout) although this wrapper only
  !! forwards it; presumably this mirrors the interface of math::add2s2 --
  !! confirm before tightening it to intent(in).
  !! @param c1 Scalar factor forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add2s2(a, b, c1, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(inout) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add2s2(a%x_d, b%x_d, c1, n_entries)
    else
       call add2s2(a%x, b%x, c1, n_entries)
    end if

  end subroutine vector_add2s2


  !> Wrapper around addsqr2s2 / device_addsqr2s2.
  !! Calls device_addsqr2s2 on the device pointers when neko_bcknd_device is
  !! 1, otherwise addsqr2s2 on the host arrays.
  !! NOTE(review): presumably a = a + c1 * b * b; the formula is not visible
  !! in this file, confirm against math::addsqr2s2.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param c1 Scalar factor forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_addsqr2s2(a, b, c1, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    real(kind=rp), intent(in) :: c1
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_addsqr2s2(a%x_d, b%x_d, c1, n_entries)
    else
       call addsqr2s2(a%x, b%x, c1, n_entries)
    end if

  end subroutine vector_addsqr2s2


  !> Multiplication by constant c, with a separate source vector.
  !! Calls device_cmult2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise cmult2 on the host arrays.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Scalar constant forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_cmult2(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    real(kind=rp), intent(in) :: c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_cmult2(a%x_d, b%x_d, c, n_entries)
    else
       call cmult2(a%x, b%x, c, n_entries)
    end if

  end subroutine vector_cmult2


  !> Vector division.
  !! Calls device_invcol2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise invcol2 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_invcol2(a, b, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_invcol2(a%x_d, b%x_d, n_entries)
    else
       call invcol2(a%x, b%x, n_entries)
    end if

  end subroutine vector_invcol2


  !> Vector multiplication.
  !! Calls device_col2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise col2 on the host arrays.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_col2(a, b, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_col2(a%x_d, b%x_d, n_entries)
    else
       call col2(a%x, b%x, n_entries)
    end if

  end subroutine vector_col2


  !> Vector multiplication with 3 vectors.
  !! Calls device_col3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise col3 on the host arrays.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_col3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_col3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call col3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_col3


  !> Wrapper around subcol3 / device_subcol3.
  !! Calls device_subcol3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise subcol3 on the host arrays.
  !! NOTE(review): presumably a = a - b * c; the formula is not visible in
  !! this file, confirm against math::subcol3.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_subcol3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_subcol3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call subcol3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_subcol3


  !> Wrapper around add3s2 / device_add3s2.
  !! Calls device_add3s2 on the device pointers when neko_bcknd_device is 1,
  !! otherwise add3s2 on the host arrays.
  !! NOTE(review): presumably a = c1 * b + c2 * c; the formula is not visible
  !! in this file, confirm against math::add3s2.
  !! @param a Vector that is updated.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param c1 First scalar forwarded to the backend routine.
  !! @param c2 Second scalar forwarded to the backend routine.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_add3s2(a, b, c, c1, c2, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    real(kind=rp), intent(in) :: c1, c2
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_add3s2(a%x_d, b%x_d, c%x_d, c1, c2, n_entries)
    else
       call add3s2(a%x, b%x, c%x, c1, c2, n_entries)
    end if

  end subroutine vector_add3s2


  !> Wrapper around addcol3 / device_addcol3.
  !! Calls device_addcol3 on the device pointers when neko_bcknd_device is 1,
  !! otherwise addcol3 on the host arrays.
  !! NOTE(review): presumably a = a + b * c; the formula is not visible in
  !! this file, confirm against math::addcol3.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_addcol3(a, b, c, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_addcol3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       call addcol3(a%x, b%x, c%x, n_entries)
    end if

  end subroutine vector_addcol3


  !> Wrapper around addcol4 / device_addcol4.
  !! Calls device_addcol4 on the device pointers when neko_bcknd_device is 1,
  !! otherwise addcol4 on the host arrays.
  !! NOTE(review): presumably a = a + b * c * d; the formula is not visible
  !! in this file, confirm against math::addcol4.
  !! @param a Vector updated in place.
  !! @param b Read-only operand.
  !! @param c Read-only operand.
  !! @param d Read-only operand.
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  subroutine vector_addcol4(a, b, c, d, n)
    type(vector_t), intent(inout) :: a
    type(vector_t), intent(in) :: b, c, d
    integer, intent(in), optional :: n
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       call device_addcol4(a%x_d, b%x_d, c%x_d, d%x_d, n_entries)
    else
       call addcol4(a%x, b%x, c%x, d%x, n_entries)
    end if

  end subroutine vector_addcol4


  !> Sum a vector of length n.
  !! Evaluates device_glsum on `a%x_d` when neko_bcknd_device is 1, otherwise
  !! glsum on `a%x`.
  !! @param a Vector to sum (read-only).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  !! @return The value returned by the selected backend routine.
  function vector_glsum(a, n) result(sum)
    type(vector_t), intent(in) :: a
    integer, intent(in), optional :: n
    real(kind=rp) :: sum
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       sum = device_glsum(a%x_d, n_entries)
    else
       sum = glsum(a%x, n_entries)
    end if

  end function vector_glsum


  !> Inner product of two vectors, as computed by glsc2 / device_glsc2.
  !! Evaluates device_glsc2 on the device pointers when neko_bcknd_device is
  !! 1, otherwise glsc2 on the host arrays.
  !! @param a First operand (read-only).
  !! @param b Second operand (read-only).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  !! @return The value returned by the selected backend routine.
  function vector_glsc2(a, b, n) result(norm)
    type(vector_t), intent(in) :: a, b
    integer, intent(in), optional :: n
    real(kind=rp) :: norm
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       norm = device_glsc2(a%x_d, b%x_d, n_entries)
    else
       norm = glsc2(a%x, b%x, n_entries)
    end if

  end function vector_glsc2


  !> Weighted inner product, as computed by glsc3 / device_glsc3.
  !! Evaluates device_glsc3 on the device pointers when neko_bcknd_device is
  !! 1, otherwise glsc3 on the host arrays.
  !! @param a First operand (read-only).
  !! @param b Second operand (read-only).
  !! @param c Third operand (read-only).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  !! @return The value returned by the selected backend routine.
  function vector_glsc3(a, b, c, n) result(norm)
    type(vector_t), intent(in) :: a, b, c
    integer, intent(in), optional :: n
    real(kind=rp) :: norm
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       norm = device_glsc3(a%x_d, b%x_d, c%x_d, n_entries)
    else
       norm = glsc3(a%x, b%x, c%x, n_entries)
    end if

  end function vector_glsc3


  !> Returns the norm of the difference of two vectors.
  !! Evaluates device_glsubnorm on the device pointers when neko_bcknd_device
  !! is 1, otherwise glsubnorm on the host arrays.
  !! @param a First operand (read-only).
  !! @param b Second operand (read-only).
  !! @param n Optional number of entries to process; `a%size()` is used when
  !! it is absent.
  !! @return The value returned by the selected backend routine.
  function vector_glsubnorm(a, b, n) result(norm)
    type(vector_t), intent(in) :: a, b
    integer, intent(in), optional :: n
    real(kind=rp) :: norm
    integer :: n_entries

    ! Use `a%size()` when no explicit count is given.
    if (.not. present(n)) then
       n_entries = a%size()
    else
       n_entries = n
    end if

    if (neko_bcknd_device == 1) then
       norm = device_glsubnorm(a%x_d, b%x_d, n_entries)
    else
       norm = glsubnorm(a%x, b%x, n_entries)
    end if

  end function vector_glsubnorm


  !> Gather a vector to a reduced contiguous array.
  !! When neko_bcknd_device is 1, the device pointers of `mask` and `a` are
  !! looked up with device_get_ptr and device_masked_gather_copy_0 is called;
  !! otherwise masked_gather_copy_0 is called on the host arrays.
  !! @param a Destination array of length n_mask.
  !! @param b Source vector.
  !! @param mask Integer mask, declared with bounds 0:n_mask.
  !! @param n Size argument forwarded unchanged to the backend routine.
  !! @param n_mask Length of `a` and upper bound of `mask`.
  !! NOTE(review): `b` and `mask` carry no intent attribute; they look
  !! read-only here -- confirm against the callee interfaces before adding
  !! intent(in).
  subroutine vector_masked_gather_copy_0(a, b, mask, n, n_mask)
    integer, intent(in) :: n, n_mask
    real(kind=rp), dimension(n_mask), intent(inout) :: a
    type(vector_t) :: b
    integer, dimension(0:n_mask) :: mask
    type(c_ptr) :: a_dev, mask_dev

    if (neko_bcknd_device /= 1) then
       call masked_gather_copy_0(a, b%x, mask, n, n_mask)
    else
       ! The host arrays must be resolved to device pointers first.
       mask_dev = device_get_ptr(mask)
       a_dev = device_get_ptr(a)
       call device_masked_gather_copy_0(a_dev, b%x_d, mask_dev, n, n_mask)
    end if

  end subroutine vector_masked_gather_copy_0


  !> Scatter a contiguous array into a vector.
  !! When neko_bcknd_device is 1, the device pointers of `mask` and `b` are
  !! looked up with device_get_ptr and device_masked_scatter_copy_0 is
  !! called; otherwise masked_scatter_copy_0 is called on the host arrays.
  !! @param a Destination vector.
  !! @param b Source array of length n_mask (read-only).
  !! @param mask Integer mask, declared with bounds 0:n_mask.
  !! @param n Size argument forwarded unchanged to the backend routine.
  !! @param n_mask Length of `b` and upper bound of `mask`.
  !! NOTE(review): `mask` carries no intent attribute; it looks read-only
  !! here -- confirm against the callee interfaces before adding intent(in).
  subroutine vector_masked_scatter_copy_0(a, b, mask, n, n_mask)
    integer, intent(in) :: n, n_mask
    type(vector_t), intent(inout) :: a
    real(kind=rp), dimension(n_mask), intent(in) :: b
    integer, dimension(0:n_mask) :: mask
    type(c_ptr) :: b_dev, mask_dev

    if (neko_bcknd_device /= 1) then
       call masked_scatter_copy_0(a%x, b, mask, n, n_mask)
    else
       ! The host arrays must be resolved to device pointers first.
       mask_dev = device_get_ptr(mask)
       b_dev = device_get_ptr(b)
       call device_masked_scatter_copy_0(a%x_d, b_dev, mask_dev, n, n_mask)
    end if

  end subroutine vector_masked_scatter_copy_0


end module vector_math

device::device_get_ptr
Return the device pointer for an associated Fortran array.
Definition device.F90:101

device_math::device_cadd
Definition device_math.F90:50

device_math
Definition device_math.F90:33

device_math::device_add2s1
subroutine, public device_add2s1(a_d, b_d, c1, n, strm)
Definition device_math.F90:517

device_math::device_sub3
subroutine, public device_sub3(a_d, b_d, c_d, n, strm)
Vector subtraction .
Definition device_math.F90:886

device_math::device_masked_scatter_copy_0
subroutine, public device_masked_scatter_copy_0(a_d, b_d, mask_d, n, n_mask, strm)
Scatter a masked vector .
Definition device_math.F90:151

device_math::device_add2s2
subroutine, public device_add2s2(a_d, b_d, c1, n, strm)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition device_math.F90:545

device_math::device_add2
subroutine, public device_add2(a_d, b_d, n, strm)
Vector addition .
Definition device_math.F90:467

device_math::device_addcol3
subroutine, public device_addcol3(a_d, b_d, c_d, n, strm)
Returns .
Definition device_math.F90:912

device_math::device_glsum
real(kind=rp) function, public device_glsum(a_d, n, strm)
Sum a vector of length n.
Definition device_math.F90:1242

device_math::device_invcol1
subroutine, public device_invcol1(a_d, n, strm)
Invert a vector .
Definition device_math.F90:706

device_math::device_add3s2
subroutine, public device_add3s2(a_d, b_d, c_d, c1, c2, n, strm)
Returns .
Definition device_math.F90:625

device_math::device_rzero
subroutine, public device_rzero(a_d, n, strm)
Zero a real vector.
Definition device_math.F90:232

device_math::device_rone
subroutine, public device_rone(a_d, n, strm)
Set all elements to one.
Definition device_math.F90:258

device_math::device_cmult
subroutine, public device_cmult(a_d, c, n, strm)
Multiplication by constant c .
Definition device_math.F90:281

device_math::device_vdot3
subroutine, public device_vdot3(dot_d, u1_d, u2_d, u3_d, v1_d, v2_d, v3_d, n, strm)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition device_math.F90:992

device_math::device_glsubnorm
real(kind=rp) function, public device_glsubnorm(a_d, b_d, n, strm)
Returns the norm of the difference of two vectors .
Definition device_math.F90:1206

device_math::device_sub2
subroutine, public device_sub2(a_d, b_d, n, strm)
Vector subtraction.
Definition device_math.F90:860

device_math::device_copy
subroutine, public device_copy(a_d, b_d, n, strm)
Copy a vector .
Definition device_math.F90:73

device_math::device_invcol3
subroutine, public device_invcol3(a_d, b_d, c_d, n, strm)
Vector division .
Definition device_math.F90:758

device_math::device_col2
subroutine, public device_col2(a_d, b_d, n, strm)
Vector multiplication .
Definition device_math.F90:783

device_math::device_add4
subroutine, public device_add4(a_d, b_d, c_d, d_d, n, strm)
Definition device_math.F90:492

device_math::device_subcol3
subroutine, public device_subcol3(a_d, b_d, c_d, n, strm)
Returns .
Definition device_math.F90:834

device_math::device_masked_gather_copy_0
subroutine, public device_masked_gather_copy_0(a_d, b_d, mask_d, n, n_mask, strm)
Gather a masked vector .
Definition device_math.F90:125

device_math::device_invcol2
subroutine, public device_invcol2(a_d, b_d, n, strm)
Vector division .
Definition device_math.F90:732

device_math::device_addsqr2s2
subroutine, public device_addsqr2s2(a_d, b_d, c1, n, strm)
Returns .
Definition device_math.F90:572

device_math::device_glsc3
real(kind=rp) function, public device_glsc3(a_d, b_d, c_d, n, strm)
Weighted inner product .
Definition device_math.F90:1082

device_math::device_glsc2
real(kind=rp) function, public device_glsc2(a_d, b_d, n, strm)
Weighted inner product .
Definition device_math.F90:1172

device_math::device_cmult2
subroutine, public device_cmult2(a_d, b_d, c, n, strm)
Multiplication by constant c .
Definition device_math.F90:308

device_math::device_col3
subroutine, public device_col3(a_d, b_d, c_d, n, strm)
Vector multiplication with 3 vectors .
Definition device_math.F90:808

device_math::device_addcol4
subroutine, public device_addcol4(a_d, b_d, c_d, d_d, n, strm)
Returns .
Definition device_math.F90:938

device_math::device_cfill
subroutine, public device_cfill(a_d, c, n, strm)
Set all elements to a constant c .
Definition device_math.F90:440

device_math::device_add3
subroutine, public device_add3(a_d, b_d, c_d, n, strm)
Vector addition .
Definition device_math.F90:599

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

mask
Object for handling masks in Neko.
Definition mask.f90:34

math
Definition math.f90:60

math::cmult
subroutine, public cmult(a, c, n)
Multiplication by constant c .
Definition math.f90:411

math::cmult2
subroutine, public cmult2(a, b, c, n)
Multiplication by constant c .
Definition math.f90:423

math::invcol2
subroutine, public invcol2(a, b, n)
Vector division .
Definition math.f90:840

math::glsc3
real(kind=rp) function, public glsc3(a, b, c, n)
Weighted inner product .
Definition math.f90:1067

math::cadd
subroutine, public cadd(a, s, n)
Add a scalar to vector .
Definition math.f90:462

math::addsqr2s2
subroutine, public addsqr2s2(a, b, c1, n)
Returns .
Definition math.f90:826

math::add2s1
subroutine, public add2s1(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition math.f90:797

math::glsc2
real(kind=rp) function, public glsc2(a, b, n)
Weighted inner product .
Definition math.f90:1048

math::masked_scatter_copy_0
subroutine, public masked_scatter_copy_0(a, b, mask, n, n_mask)
Scatter a contiguous vector to masked positions in a target array.
Definition math.f90:358

math::subcol3
subroutine, public subcol3(a, b, c, n)
Returns .
Definition math.f90:881

math::rone
subroutine, public rone(a, n)
Set all elements to one.
Definition math.f90:238

math::add3
subroutine, public add3(a, b, c, n)
Vector addition .
Definition math.f90:739

math::glsum
real(kind=rp) function, public glsum(a, n)
Sum a vector of length n.
Definition math.f90:499

math::sub3
subroutine, public sub3(a, b, c, n)
Vector subtraction .
Definition math.f90:781

math::addcol4
subroutine, public addcol4(a, b, c, d, n)
Returns .
Definition math.f90:972

math::add2
subroutine, public add2(a, b, n)
Vector addition .
Definition math.f90:726

math::cfill
subroutine, public cfill(a, c, n)
Set all elements to a constant c .
Definition math.f90:487

math::invcol3
subroutine, public invcol3(a, b, c, n)
Invert a vector .
Definition math.f90:626

math::add3s2
subroutine, public add3s2(a, b, c, c1, c2, n)
Returns .
Definition math.f90:895

math::masked_gather_copy_0
subroutine, public masked_gather_copy_0(a, b, mask, n, n_mask)
Gather a masked vector to a reduced contiguous vector.
Definition math.f90:312

math::addcol3
subroutine, public addcol3(a, b, c, n)
Returns .
Definition math.f90:958

math::invcol1
subroutine, public invcol1(a, n)
Invert a vector .
Definition math.f90:614

math::col2
subroutine, public col2(a, b, n)
Vector multiplication .
Definition math.f90:854

math::copy
subroutine, public copy(a, b, n)
Copy a vector .
Definition math.f90:249

math::add4
subroutine, public add4(a, b, c, d, n)
Vector addition .
Definition math.f90:753

math::col3
subroutine, public col3(a, b, c, n)
Vector multiplication with 3 vectors .
Definition math.f90:867

math::vdot3
subroutine, public vdot3(dot, u1, u2, u3, v1, v2, v3, n)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition math.f90:684

math::rzero
subroutine, public rzero(a, n)
Zero a real vector.
Definition math.f90:205

math::glsubnorm
real(kind=rp) function, public glsubnorm(a, b, n)
Returns the norm of the difference of two vectors .
Definition math.f90:1109

math::sub2
subroutine, public sub2(a, b, n)
Vector subtraction.
Definition math.f90:768

math::add2s2
subroutine, public add2s2(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on second argument)
Definition math.f90:812

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

vector_math
Definition vector_math.f90:60

vector_math::vector_masked_gather_copy_0
subroutine, public vector_masked_gather_copy_0(a, b, mask, n, n_mask)
Gather a vector to a reduced contiguous array.
Definition vector_math.f90:722

vector_math::vector_glsc3
real(kind=rp) function, public vector_glsc3(a, b, c, n)
Definition vector_math.f90:674

vector_math::vector_add2
subroutine, public vector_add2(a, b, n)
Vector addition .
Definition vector_math.f90:283

vector_math::vector_vdot3
subroutine, public vector_vdot3(dot, u1, u2, u3, v1, v2, v3, n)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition vector_math.f90:255

vector_math::vector_copy
subroutine, public vector_copy(a, b, n)
Copy a vector .
Definition vector_math.f90:132

vector_math::vector_sub3
subroutine, public vector_sub3(a, b, c, n)
Vector subtraction .
Definition vector_math.f90:367

vector_math::vector_cmult
subroutine, public vector_cmult(a, c, n)
Multiplication by constant c .
Definition vector_math.f90:152

vector_math::vector_invcol1
subroutine, public vector_invcol1(a, n)
Invert a vector .
Definition vector_math.f90:212

vector_math::vector_add3s2
subroutine, public vector_add3s2(a, b, c, c1, c2, n)
Returns .
Definition vector_math.f90:567

vector_math::vector_sub2
subroutine, public vector_sub2(a, b, n)
Vector subtraction.
Definition vector_math.f90:346

vector_math::vector_addsqr2s2
subroutine, public vector_addsqr2s2(a, b, c1, n)
Returns .
Definition vector_math.f90:436

vector_math::vector_col2
subroutine, public vector_col2(a, b, n)
Vector multiplication .
Definition vector_math.f90:502

vector_math::vector_cfill
subroutine, public vector_cfill(a, c, n)
Set all elements to a constant c .
Definition vector_math.f90:192

vector_math::vector_glsum
real(kind=rp) function, public vector_glsum(a, n)
Definition vector_math.f90:634

vector_math::vector_glsc2
real(kind=rp) function, public vector_glsc2(a, b, n)
Definition vector_math.f90:654

vector_math::vector_addcol3
subroutine, public vector_addcol3(a, b, c, n)
Returns .
Definition vector_math.f90:590

vector_math::vector_glsubnorm
real(kind=rp) function, public vector_glsubnorm(a, b, n)
Definition vector_math.f90:694

vector_math::vector_invcol2
subroutine, public vector_invcol2(a, b, n)
Vector division .
Definition vector_math.f90:480

vector_math::vector_subcol3
subroutine, public vector_subcol3(a, b, c, n)
Returns .
Definition vector_math.f90:545

vector_math::vector_cadd
subroutine, public vector_cadd(a, s, n)
Add a scalar to vector .
Definition vector_math.f90:172

vector_math::vector_add4
subroutine vector_add4(a, b, c, d, n)
Vector addition .
Definition vector_math.f90:325

vector_math::vector_add3
subroutine, public vector_add3(a, b, c, n)
Vector addition .
Definition vector_math.f90:304

vector_math::vector_add2s1
subroutine, public vector_add2s1(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition vector_math.f90:391

vector_math::vector_add2s2
subroutine, public vector_add2s2(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on second argument)
Definition vector_math.f90:414

vector_math::vector_addcol4
subroutine, public vector_addcol4(a, b, c, d, n)
Returns .
Definition vector_math.f90:612

vector_math::vector_cmult2
subroutine, public vector_cmult2(a, b, c, n)
Multiplication by constant c .
Definition vector_math.f90:458

vector_math::vector_rone
subroutine, public vector_rone(a, n)
Set all elements to one.
Definition vector_math.f90:113

vector_math::vector_rzero
subroutine, public vector_rzero(a, n)
Zero a real vector.
Definition vector_math.f90:94

vector_math::vector_col3
subroutine, public vector_col3(a, b, c, n)
Vector multiplication with 3 vectors .
Definition vector_math.f90:523

vector_math::vector_masked_scatter_copy_0
subroutine, public vector_masked_scatter_copy_0(a, b, mask, n, n_mask)
Scatter a contiguous array into a vector.
Definition vector_math.f90:747

vector_math::vector_invcol3
subroutine, public vector_invcol3(a, b, c, n)
Invert a vector .
Definition vector_math.f90:232

vector
Defines a vector.
Definition vector.f90:34

vector::vector_t
Definition vector.f90:48