d6/ddb/math_8f90_source.html

! Copyright (c) 2008-2020, UCHICAGO ARGONNE, LLC.

!

! The UChicago Argonne, LLC as Operator of Argonne National

! Laboratory holds copyright in the Software. The copyright holder

! reserves all rights except those expressly granted to licensees,

! and U.S. Government license rights.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

! 1. Redistributions of source code must retain the above copyright

! notice, this list of conditions and the disclaimer below.

!

! 2. Redistributions in binary form must reproduce the above copyright

! notice, this list of conditions and the disclaimer (as noted below)

! in the documentation and/or other materials provided with the

! distribution.

!

! 3. Neither the name of ANL nor the names of its contributors

! may be used to endorse or promote products derived from this software

! without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL

! UCHICAGO ARGONNE, LLC, THE U.S. DEPARTMENT OF

! ENERGY OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED

! TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

! DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

! THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

! (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

! OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

!

! Additional BSD Notice

! ---------------------

! 1. This notice is required to be provided under our contract with

! the U.S. Department of Energy (DOE). This work was produced at

! Argonne National Laboratory under Contract

! No. DE-AC02-06CH11357 with the DOE.

!

! 2. Neither the United States Government nor UCHICAGO ARGONNE,

! LLC nor any of their employees, makes any warranty,

! express or implied, or assumes any liability or responsibility for the

! accuracy, completeness, or usefulness of any information, apparatus,

! product, or process disclosed, or represents that its use would not

! infringe privately-owned rights.

!

! 3. Also, reference herein to any specific commercial products, process,

! or services by trade name, trademark, manufacturer or otherwise does

! not necessarily constitute or imply its endorsement, recommendation,

! or favoring by the United States Government or UCHICAGO ARGONNE LLC.

! The views and opinions of authors expressed

! herein do not necessarily state or reflect those of the United States

! Government or UCHICAGO ARGONNE, LLC, and shall

! not be used for advertising or product endorsement purposes.

!

module math

  use num_types, only : rp, dp, sp, qp, i4, xp

  use utils, only: neko_error

  use comm, only: neko_comm, mpi_real_precision, mpi_extra_precision

  use mpi_f08, only: mpi_min, mpi_max, mpi_sum, mpi_in_place, mpi_integer, &

       mpi_allreduce

  implicit none

  private


  !> Machine epsilon of the working precision kind `rp`.
  real(kind=rp), public, parameter :: neko_eps = epsilon(1.0_rp)


  !> Natural logarithm of 2, evaluated in working precision.
  real(kind=rp), public, parameter :: neko_m_ln2 = log(2.0_rp)


  !> The constant pi, evaluated as 4*atan(1) in working precision.
  real(kind=rp), public, parameter :: pi = 4._rp*atan(1._rp)


  !> Absolute comparison of two reals; one specific procedure per real
  !! kind (`sp`, `dp`, `qp`).
  interface abscmp

     module procedure sabscmp, dabscmp, qabscmp

  interface abscmp …

  end interface abscmp


  !> In-place ascending sort that also returns the permutation; specifics
  !! for `real(rp)` and `integer(i4)` data.
  interface sort

     module procedure sortrp, sorti4

  interface sort …

  end interface sort


  !> Gather-style permutation, `b(i) = b_old(ind(i))`.
  interface swap

     module procedure swapdp, swapi4

  interface swap …

  end interface swap


  !> Scatter-style permutation, `b(ind(i)) = b_old(i)`.
  interface reord

     module procedure reorddp, reordi4

  interface reord …

  end interface reord


  !> Reverse the order of a vector together with its index array.
  interface flipv

     module procedure flipvdp, flipvi4

  interface flipv …

  end interface flipv


  !> Relative comparison of two reals with an optional tolerance; one
  !! specific procedure per real kind (`sp`, `dp`, `qp`).
  interface relcmp

     module procedure srelcmp, drelcmp, qrelcmp

  interface relcmp …

  end interface relcmp


  !> Point-wise maximum: vector/vector and vector/scalar variants, either
  !! in place (two operands) or into a separate result (three operands).
  interface pwmax

     module procedure pwmax_vec2, pwmax_vec3, pwmax_scal2, pwmax_scal3

  interface pwmax …

  end interface pwmax


  !> Point-wise minimum: vector/vector and vector/scalar variants, either
  !! in place (two operands) or into a separate result (three operands).
  interface pwmin

     module procedure pwmin_vec2, pwmin_vec3, pwmin_sca2, pwmin_sca3

  interface pwmin …

  end interface pwmin


  public :: abscmp, rzero, izero, row_zero, rone, copy, cmult, cadd, cfill, &

       glsum, glmax, glmin, chsign, vlmax, vlmin, invcol1, invcol3, invers2, &

       vcross, vdot2, vdot3, vlsc3, vlsc2, add2, add3, add4, sub2, sub3, &

       add2s1, add2s2, addsqr2s2, cmult2, invcol2, col2, col3, subcol3, &

       add3s2, subcol4, addcol3, addcol4, ascol5, p_update, x_update, glsc2, &

       glsc3, glsc4, sort, masked_copy, cfill_mask, relcmp, glimax, glimin, &

       swap, reord, flipv, cadd2, masked_red_copy, absval, pwmax, pwmin


contains


  !> Absolute comparison of two single precision reals.
  !! @param x First value.
  !! @param y Second value.
  !! @return `.true.` when `|x - y|` is strictly smaller than `neko_eps`.
  pure function sabscmp(x, y) result(is_close)
    real(kind=sp), intent(in) :: x, y
    logical :: is_close

    is_close = (neko_eps .gt. abs(x - y))
  end function sabscmp


  !> Absolute comparison of two double precision reals.
  !! @param x First value.
  !! @param y Second value.
  !! @return `.true.` when `|x - y|` is strictly smaller than `neko_eps`.
  pure function dabscmp(x, y) result(is_close)
    real(kind=dp), intent(in) :: x, y
    logical :: is_close

    is_close = (neko_eps .gt. abs(x - y))
  end function dabscmp


  !> Absolute comparison of two quad precision reals.
  !! @param x First value.
  !! @param y Second value.
  !! @return `.true.` when `|x - y|` is strictly smaller than `neko_eps`.
  pure function qabscmp(x, y) result(is_close)
    real(kind=qp), intent(in) :: x, y
    logical :: is_close

    is_close = (neko_eps .gt. abs(x - y))
  end function qabscmp


  !> Relative comparison of two single precision reals.
  !! @param x Value to test.
  !! @param y Reference value; the tolerance is scaled by `|y|`.
  !! @param eps Optional relative tolerance; `neko_eps` is used when absent.
  !! @return `.true.` when `|x - y| <= tol * |y|`.
  pure function srelcmp(x, y, eps) result(is_close)
    real(kind=sp), intent(in) :: x, y
    real(kind=sp), intent(in), optional :: eps
    logical :: is_close

    if (.not. present(eps)) then
       ! No tolerance supplied: fall back to the module default.
       is_close = abs(x - y) <= neko_eps*abs(y)
    else
       is_close = abs(x - y) <= eps*abs(y)
    end if
  end function srelcmp


  !> Relative comparison of two double precision reals.
  !! @param x Value to test.
  !! @param y Reference value; the tolerance is scaled by `|y|`.
  !! @param eps Optional relative tolerance; `neko_eps` is used when absent.
  !! @return `.true.` when `|x - y| <= tol * |y|`.
  pure function drelcmp(x, y, eps) result(is_close)
    real(kind=dp), intent(in) :: x, y
    real(kind=dp), intent(in), optional :: eps
    logical :: is_close

    if (.not. present(eps)) then
       ! No tolerance supplied: fall back to the module default.
       is_close = abs(x - y) <= neko_eps*abs(y)
    else
       is_close = abs(x - y) <= eps*abs(y)
    end if
  end function drelcmp


  !> Relative comparison of two quad precision reals.
  !! @details Uses the multiplicative form `|x - y| <= tol * |y|`, matching
  !! `srelcmp` and `drelcmp`. The previous form divided by `|y|`, which
  !! evaluates 0/0 for `x = y = 0` and therefore reported two exact zeros
  !! as different; it also used a strict inequality, unlike the other kinds.
  !! @param x Value to test.
  !! @param y Reference value; the tolerance is scaled by `|y|`.
  !! @param eps Optional relative tolerance; `neko_eps` is used when absent.
  !! @return `.true.` when `|x - y| <= tol * |y|`.
  pure function qrelcmp(x, y, eps)
    real(kind=qp), intent(in) :: x
    real(kind=qp), intent(in) :: y
    real(kind=qp), intent(in), optional :: eps
    logical :: qrelcmp

    if (present(eps)) then
       qrelcmp = abs(x - y) .le. eps*abs(y)
    else
       qrelcmp = abs(x - y) .le. neko_eps*abs(y)
    end if
  end function qrelcmp


  !> Zero a real vector.
  !! @param a Vector of length `n`; every entry is set to zero.
  !! @param n Number of entries.
  subroutine rzero(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a

    a = 0.0_rp
  end subroutine rzero


  !> Zero an integer vector.
  !! @param a Vector of length `n`; every entry is set to zero.
  !! @param n Number of entries.
  subroutine izero(a, n)
    integer, intent(in) :: n
    integer, dimension(n), intent(inout) :: a

    a = 0
  end subroutine izero


  !> Set row `e` of the matrix `a` to zero.
  !! @param a Matrix of shape `(m, n)`.
  !! @param m Number of rows.
  !! @param n Number of columns.
  !! @param e Index of the row to clear.
  subroutine row_zero(a, m, n, e)
    integer, intent(in) :: m, n, e
    real(kind=rp), intent(inout) :: a(m,n)

    a(e, :) = 0.0_rp
  end subroutine row_zero


  !> Set every entry of a real vector to one.
  !! @param a Vector of length `n`.
  !! @param n Number of entries.
  subroutine rone(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a

    a = 1.0_rp
  end subroutine rone


  !> Copy a vector, `a = b`.
  !! @param a Destination vector of length `n`.
  !! @param b Source vector of length `n`.
  !! @param n Number of entries.
  subroutine copy(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), dimension(n), intent(inout) :: a

    a = b
  end subroutine copy


  !> Copy the masked entries of a vector, `a(mask) = b(mask)`.
  !! @param a Destination vector of length `n`; only masked entries change.
  !! @param b Source vector of length `n`.
  !! @param mask Index list declared with bounds `0:m`; entries `1..m` are
  !! read as indices into `a` and `b`. Entry 0 is not accessed here.
  !! NOTE(review): entry 0 presumably stores the mask length -- confirm
  !! against callers.
  !! @param n Length of `a` and `b`.
  !! @param m Number of mask entries.
  subroutine masked_copy(a, b, mask, n, m)
    integer, intent(in) :: n, m
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), dimension(n), intent(inout) :: a
    ! The mask is only read, so it is declared intent(in) like in cfill_mask.
    integer, dimension(0:m), intent(in) :: mask
    integer :: i, j

    ! An explicit loop stays well defined even if the mask repeats an index.
    do i = 1, m
       j = mask(i)
       a(j) = b(j)
    end do
  end subroutine masked_copy


  !> Gather the masked entries of a vector into a reduced vector,
  !! `a(i) = b(mask(i))`.
  !! @param a Destination vector of length `m`.
  !! @param b Source vector of length `n`.
  !! @param mask Index list declared with bounds `0:m`; entries `1..m` are
  !! read as indices into `b`. Entry 0 is not accessed here.
  !! NOTE(review): entry 0 presumably stores the mask length -- confirm
  !! against callers.
  !! @param n Length of `b`.
  !! @param m Number of mask entries, and length of `a`.
  subroutine masked_red_copy(a, b, mask, n, m)
    integer, intent(in) :: n, m
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), dimension(m), intent(inout) :: a
    ! The mask is only read, so it is declared intent(in) like in cfill_mask.
    integer, dimension(0:m), intent(in) :: mask
    integer :: i, j

    do i = 1, m
       j = mask(i)
       a(i) = b(j)
    end do
  end subroutine masked_red_copy


  !> Fill the masked entries of a vector with a constant, `a(mask) = c`.
  !! @param a Vector of length `size`; only masked entries change.
  !! @param c Fill value.
  !! @param size Length of `a`.
  !! @param mask Indices into `a`, one per masked entry.
  !! @param mask_size Number of entries in `mask`.
  subroutine cfill_mask(a, c, size, mask, mask_size)
    integer, intent(in) :: size, mask_size
    real(kind=rp), dimension(size), intent(inout) :: a
    real(kind=rp), intent(in) :: c
    integer, dimension(mask_size), intent(in) :: mask
    integer :: k, idx

    ! An explicit loop stays well defined even if the mask repeats an index.
    do k = 1, mask_size
       idx = mask(k)
       a(idx) = c
    end do
  end subroutine cfill_mask


  !> Multiply a vector by a constant in place, `a = c * a`.
  !! @param a Vector of length `n`, scaled in place.
  !! @param c Scale factor.
  !! @param n Number of entries.
  subroutine cmult(a, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), intent(in) :: c

    a = c * a
  end subroutine cmult


  !> Add a scalar to every entry of a vector in place, `a = a + s`.
  !! @param a Vector of length `n`, updated in place.
  !! @param s Scalar to add.
  !! @param n Number of entries.
  subroutine cadd(a, s, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), intent(in) :: s

    a = a + s
  end subroutine cadd


  !> Add a scalar to a vector and store the result, `a = b + s`.
  !! @param a Result vector of length `n`.
  !! @param b Input vector of length `n`.
  !! @param s Scalar to add.
  !! @param n Number of entries.
  subroutine cadd2(a, b, s, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: s

    a = b + s
  end subroutine cadd2


  !> Set every entry of a vector to a constant, `a = c`.
  !! @param a Vector of length `n`.
  !! @param c Fill value.
  !! @param n Number of entries.
  subroutine cfill(a, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), intent(in) :: c

    a = c
  end subroutine cfill


  !> Sum of a vector of length `n`, reduced over all ranks of `neko_comm`.
  !! @details The local sum is accumulated in the `xp` kind and reduced with
  !! `mpi_sum` before being converted back to working precision.
  !! @param a Local vector of length `n` (read only).
  !! @param n Number of local entries.
  !! @return Sum of all entries across the communicator.
  function glsum(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a
    real(kind=rp) :: glsum
    real(kind=xp) :: tmp
    integer :: i, ierr

    ! Initialise the accumulator with a literal of its own kind, matching
    ! glsc2/glsc3/glsc4.
    tmp = 0.0_xp
    do i = 1, n
       tmp = tmp + a(i)
    end do
    call mpi_allreduce(mpi_in_place, tmp, 1, &
         mpi_extra_precision, mpi_sum, neko_comm, ierr)
    glsum = tmp
  end function glsum


  !> Maximum of a vector of length `n`, reduced over all ranks of
  !! `neko_comm`.
  !! @param a Local vector of length `n` (read only).
  !! @param n Number of local entries.
  !! @return Largest entry across the communicator. A rank with `n = 0`
  !! contributes `-huge(0.0_rp)`.
  function glmax(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a
    real(kind=rp) :: tmp, glmax
    integer :: i, ierr

    ! Start from the most negative finite value so any entry replaces it.
    tmp = -huge(0.0_rp)
    do i = 1, n
       tmp = max(tmp, a(i))
    end do
    call mpi_allreduce(tmp, glmax, 1, &
         mpi_real_precision, mpi_max, neko_comm, ierr)
  end function glmax


  !> Maximum of an integer vector of length `n`, reduced over all ranks of
  !! `neko_comm`.
  !! @param a Local integer vector of length `n` (read only).
  !! @param n Number of local entries.
  !! @return Largest entry across the communicator. A rank with `n = 0`
  !! contributes `-huge(0)`.
  function glimax(a, n)
    integer, intent(in) :: n
    integer, dimension(n), intent(in) :: a
    integer :: tmp, glimax
    integer :: i, ierr

    tmp = -huge(0)
    do i = 1, n
       tmp = max(tmp, a(i))
    end do
    call mpi_allreduce(tmp, glimax, 1, &
         mpi_integer, mpi_max, neko_comm, ierr)
  end function glimax


  !> Minimum of a vector of length `n`, reduced over all ranks of
  !! `neko_comm`.
  !! @param a Local vector of length `n` (read only).
  !! @param n Number of local entries.
  !! @return Smallest entry across the communicator. A rank with `n = 0`
  !! contributes `huge(0.0_rp)`.
  function glmin(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a
    real(kind=rp) :: tmp, glmin
    integer :: i, ierr

    ! Start from the largest finite value so any entry replaces it.
    tmp = huge(0.0_rp)
    do i = 1, n
       tmp = min(tmp, a(i))
    end do
    call mpi_allreduce(tmp, glmin, 1, &
         mpi_real_precision, mpi_min, neko_comm, ierr)
  end function glmin


  !> Minimum of an integer vector of length `n`, reduced over all ranks of
  !! `neko_comm`.
  !! @param a Local integer vector of length `n` (read only).
  !! @param n Number of local entries.
  !! @return Smallest entry across the communicator. A rank with `n = 0`
  !! contributes `huge(0)`.
  function glimin(a, n)
    integer, intent(in) :: n
    integer, dimension(n), intent(in) :: a
    integer :: tmp, glimin
    integer :: i, ierr

    tmp = huge(0)
    do i = 1, n
       tmp = min(tmp, a(i))
    end do
    call mpi_allreduce(tmp, glimin, 1, &
         mpi_integer, mpi_min, neko_comm, ierr)
  end function glimin


  !> Flip the sign of every entry of a vector in place, `a = -a`.
  !! @param a Vector of length `n`, negated in place.
  !! @param n Number of entries.
  subroutine chsign(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a

    a = -a
  end subroutine chsign


  !> Local (rank-private) maximum of a vector.
  !! @details The running maximum starts at `-huge(0.0_rp)`, as in `glmax`.
  !! The previous hard-coded sentinel (-99e20) gave a wrong answer whenever
  !! every entry was smaller than the sentinel itself.
  !! @param vec Vector of length `n`.
  !! @param n Number of entries.
  !! @return Largest entry of `vec`, or `-huge(0.0_rp)` when `n <= 0`.
  function vlmax(vec,n) result(tmax)
    integer, intent(in) :: n
    real(kind=rp), intent(in) :: vec(n)
    real(kind=rp) :: tmax
    integer :: i

    tmax = -huge(0.0_rp)
    do i = 1, n
       tmax = max(tmax, vec(i))
    end do
  end function vlmax


  !> Local (rank-private) minimum of a vector.
  !! @details The running minimum starts at `huge(0.0_rp)`, as in `glmin`.
  !! The previous hard-coded sentinel (99e20, written as a default-real
  !! literal) gave a wrong answer whenever every entry was larger than the
  !! sentinel itself.
  !! @param vec Vector of length `n`.
  !! @param n Number of entries.
  !! @return Smallest entry of `vec`, or `huge(0.0_rp)` when `n <= 0`.
  function vlmin(vec,n) result(tmin)
    integer, intent(in) :: n
    real(kind=rp), intent(in) :: vec(n)
    real(kind=rp) :: tmin
    integer :: i

    tmin = huge(0.0_rp)
    do i = 1, n
       tmin = min(tmin, vec(i))
    end do
  end function vlmin


  !> Invert a vector entry by entry in place, `a = 1 / a`.
  !! @details The division is evaluated in the `xp` kind before the result
  !! is stored back in working precision.
  !! @param a Vector of length `n`, inverted in place.
  !! @param n Number of entries.
  subroutine invcol1(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a

    a = 1.0_xp / real(a, xp)
  end subroutine invcol1


  !> Entry-wise vector division, `a = b / c`.
  !! @details The numerator is converted to the `xp` kind before dividing.
  !! @param a Result vector of length `n`.
  !! @param b Numerator vector of length `n`.
  !! @param c Denominator vector of length `n`.
  !! @param n Number of entries.
  subroutine invcol3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b,c

    a = real(b, xp) / c
  end subroutine invcol3


  !> Entry-wise inverse of a vector, `a = 1 / b`.
  !! @details The division is evaluated in the `xp` kind before the result
  !! is stored in working precision.
  !! @param a Result vector of length `n`.
  !! @param b Input vector of length `n`.
  !! @param n Number of entries.
  subroutine invers2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = 1.0_xp / real(b, xp)
  end subroutine invers2


  !> Point-wise cross product `u = v x w` of two 3-component vector fields
  !! stored component by component.
  !! @param u1,u2,u3 Components of the result, each of length `n`.
  !! @param v1,v2,v3 Components of the first operand.
  !! @param w1,w2,w3 Components of the second operand.
  !! @param n Number of points.
  subroutine vcross(u1, u2, u3, v1, v2, v3, w1, w2, w3, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: v1, v2, v3
    real(kind=rp), dimension(n), intent(in) :: w1, w2, w3
    real(kind=rp), dimension(n), intent(out) :: u1, u2, u3

    u1 = v2*w3 - v3*w2
    u2 = v3*w1 - v1*w3
    u3 = v1*w2 - v2*w1
  end subroutine vcross


  !> Point-wise dot product of two 2-component vector fields,
  !! `dot = u1*v1 + u2*v2`.
  !! @param dot Result, of length `n`.
  !! @param u1,u2 Components of the first operand.
  !! @param v1,v2 Components of the second operand.
  !! @param n Number of points.
  subroutine vdot2(dot, u1, u2, v1, v2, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: u1, u2
    real(kind=rp), dimension(n), intent(in) :: v1, v2
    real(kind=rp), dimension(n), intent(out) :: dot

    dot = u1*v1 + u2*v2
  end subroutine vdot2


  !> Point-wise dot product of two 3-component vector fields,
  !! `dot = u1*v1 + u2*v2 + u3*v3`.
  !! @param dot Result, of length `n`.
  !! @param u1,u2,u3 Components of the first operand.
  !! @param v1,v2,v3 Components of the second operand.
  !! @param n Number of points.
  subroutine vdot3(dot, u1, u2, u3, v1, v2, v3, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: u1, u2, u3
    real(kind=rp), dimension(n), intent(in) :: v1, v2, v3
    real(kind=rp), dimension(n), intent(out) :: dot

    dot = u1*v1 + u2*v2 + u3*v3
  end subroutine vdot3


  !> Local (rank-private) triple-product sum, `s = sum_k u(k)*v(k)*w(k)`.
  !! @param u,v,w Input vectors of length `n`.
  !! @param n Number of entries.
  !! @return The accumulated sum in working precision; zero when `n <= 0`.
  function vlsc3(u, v, w, n) result(s)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: u, v, w
    real(kind=rp) :: s
    integer :: k

    ! Sequential accumulation keeps the summation order fixed.
    s = 0.0_rp
    do k = 1, n
       s = s + u(k)*v(k)*w(k)
    end do
  end function vlsc3


  !> Local (rank-private) product sum, `s = sum_k u(k)*v(k)`.
  !! @param u,v Input vectors of length `n`.
  !! @param n Number of entries.
  !! @return The accumulated sum in working precision; zero when `n <= 0`.
  function vlsc2(u, v, n) result(s)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: u, v
    real(kind=rp) :: s
    integer :: k

    ! Sequential accumulation keeps the summation order fixed.
    s = 0.0_rp
    do k = 1, n
       s = s + u(k)*v(k)
    end do
  end function vlsc2


  !> In-place vector addition, `a = a + b`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n` to add.
  !! @param n Number of entries.
  subroutine add2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = a + b
  end subroutine add2


  !> Vector addition into a separate result, `a = b + c`.
  !! @param a Result vector of length `n`.
  !! @param b,c Operand vectors of length `n`.
  !! @param n Number of entries.
  subroutine add3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = b + c
  end subroutine add3


  !> Sum of three vectors, `a = b + c + d`.
  !! @param a Result vector of length `n`.
  !! @param b,c,d Operand vectors of length `n`.
  !! @param n Number of entries.
  subroutine add4(a, b, c, d, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(out) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c, d

    a = b + c + d
  end subroutine add4


  !> In-place vector subtraction, `a = a - b`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n` to subtract. It is only read, so it is
  !! declared `intent(in)` (as in `add2`); this also lets callers pass
  !! read-only data.
  !! @param n Number of entries.
  subroutine sub2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = a - b
  end subroutine sub2


  !> Vector subtraction into a separate result, `a = b - c`.
  !! @param a Result vector of length `n`.
  !! @param b Minuend vector of length `n`.
  !! @param c Subtrahend vector of length `n`.
  !! @param n Number of entries.
  subroutine sub3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = b - c
  end subroutine sub3


  !> Scaled in-place update where the scalar multiplies the first vector,
  !! `a = c1 * a + b`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n` to add. It is only read, so it is
  !! declared `intent(in)`; this also lets callers pass read-only data.
  !! @param c1 Scalar multiplying `a`.
  !! @param n Number of entries.
  subroutine add2s1(a, b, c1, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c1

    a = c1 * a + b
  end subroutine add2s1


  !> Scaled in-place update where the scalar multiplies the second vector,
  !! `a = a + c1 * b`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n` to scale and add. It is only read, so
  !! it is declared `intent(in)`; this also lets callers pass read-only
  !! data.
  !! @param c1 Scalar multiplying `b`.
  !! @param n Number of entries.
  subroutine add2s2(a, b, c1, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c1

    a = a + c1 * b
  end subroutine add2s2


  !> Add a scaled entry-wise square in place, `a = a + c1 * (b * b)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n` whose entries are squared.
  !! @param c1 Scalar multiplying the squares.
  !! @param n Number of entries.
  subroutine addsqr2s2(a, b, c1, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c1

    a = a + c1 * ( b * b )
  end subroutine addsqr2s2


  !> Multiply a vector by a constant into a separate result, `a = c * b`.
  !! @param a Result vector of length `n`.
  !! @param b Input vector of length `n`.
  !! @param c Scale factor.
  !! @param n Number of entries.
  subroutine cmult2(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c

    a = c * b
  end subroutine cmult2


  !> In-place entry-wise vector division, `a = a / b`.
  !! @details The numerator is converted to the `xp` kind before dividing.
  !! @param a Vector of length `n`, divided in place.
  !! @param b Denominator vector of length `n`.
  !! @param n Number of entries.
  subroutine invcol2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = real(a, xp) / b
  end subroutine invcol2


  !> In-place entry-wise vector multiplication, `a = a * b`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n`.
  !! @param n Number of entries.
  subroutine col2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = a * b
  end subroutine col2


  !> Entry-wise vector multiplication into a separate result, `a = b * c`.
  !! @param a Result vector of length `n`.
  !! @param b,c Operand vectors of length `n`.
  !! @param n Number of entries.
  subroutine col3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = b * c
  end subroutine col3


  !> Subtract an entry-wise product in place, `a = a - b * c`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c Vectors of length `n` forming the product.
  !! @param n Number of entries.
  subroutine subcol3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = a - b * c
  end subroutine subcol3


  !> Linear combination of two vectors, `a = c1 * b + c2 * c`.
  !! @param a Result vector of length `n`.
  !! @param b,c Operand vectors of length `n`.
  !! @param c1 Scalar multiplying `b`.
  !! @param c2 Scalar multiplying `c`.
  !! @param n Number of entries.
  subroutine add3s2(a, b, c, c1, c2 ,n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c
    real(kind=rp), intent(in) :: c1, c2

    a = c1 * b + c2 * c
  end subroutine add3s2


  !> Subtract an entry-wise triple product in place, `a = a - b * c * d`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c,d Vectors of length `n` forming the product.
  !! @param n Number of entries.
  subroutine subcol4(a, b, c, d, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c, d

    a = a - b * c * d
  end subroutine subcol4


  !> Add an entry-wise product in place, `a = a + b * c`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c Vectors of length `n` forming the product.
  !! @param n Number of entries.
  subroutine addcol3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = a + b * c
  end subroutine addcol3


  !> Add an entry-wise triple product in place, `a = a + b * c * d`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c,d Vectors of length `n` forming the product.
  !! @param n Number of entries.
  subroutine addcol4(a, b, c, d, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c, d

    a = a + b * c * d
  end subroutine addcol4


  !> Difference of two entry-wise products, `a = b * c - d * e`.
  !! @param a Result vector of length `n`.
  !! @param b,c Vectors forming the first product.
  !! @param d,e Vectors forming the second product.
  !! @param n Number of entries.
  subroutine ascol5(a, b, c, d, e, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c, d, e

    a = b*c - d*e
  end subroutine ascol5


  !> In-place update `a = b + c1 * (a - c2 * c)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c Input vectors of length `n`.
  !! @param c1 Scalar multiplying the bracketed term.
  !! @param c2 Scalar multiplying `c`.
  !! @param n Number of entries.
  subroutine p_update(a, b, c, c1, c2, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c
    real(kind=rp), intent(in) :: c1, c2

    a = b + c1*(a - c2*c)
  end subroutine p_update


  !> In-place update `a = a + c1 * b + c2 * c`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b,c Input vectors of length `n`.
  !! @param c1 Scalar multiplying `b`.
  !! @param c2 Scalar multiplying `c`.
  !! @param n Number of entries.
  subroutine x_update(a, b, c, c1, c2, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c
    real(kind=rp), intent(in) :: c1, c2

    a = a + c1*b + c2*c
  end subroutine x_update


  !> Inner product `sum_k a(k)*b(k)`, reduced over all ranks of `neko_comm`.
  !! @details The local sum is accumulated in the `xp` kind and reduced with
  !! `mpi_sum` before being converted back to working precision.
  !! @param a,b Local vectors of length `n`.
  !! @param n Number of local entries.
  !! @return The global inner product.
  function glsc2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a, b
    real(kind=rp) :: glsc2
    real(kind=xp) :: acc
    integer :: k, ierr

    ! Sequential accumulation keeps the summation order fixed.
    acc = 0.0_xp
    do k = 1, n
       acc = acc + a(k) * b(k)
    end do

    call mpi_allreduce(mpi_in_place, acc, 1, &
         mpi_extra_precision, mpi_sum, neko_comm, ierr)
    glsc2 = acc
  end function glsc2


  !> Weighted inner product `sum_k a(k)*b(k)*c(k)`, reduced over all ranks
  !! of `neko_comm`.
  !! @details The local sum is accumulated in the `xp` kind and reduced with
  !! `mpi_sum` before being converted back to working precision.
  !! @param a,b,c Local vectors of length `n`.
  !! @param n Number of local entries.
  !! @return The global weighted inner product.
  function glsc3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a, b, c
    real(kind=rp) :: glsc3
    real(kind=xp) :: acc
    integer :: k, ierr

    ! Sequential accumulation keeps the summation order fixed.
    acc = 0.0_xp
    do k = 1, n
       acc = acc + a(k) * b(k) * c(k)
    end do

    call mpi_allreduce(mpi_in_place, acc, 1, &
         mpi_extra_precision, mpi_sum, neko_comm, ierr)
    glsc3 = acc
  end function glsc3


  !> Four-factor product sum `sum_k a(k)*b(k)*c(k)*d(k)`, reduced over all
  !! ranks of `neko_comm`.
  !! @details The local sum is accumulated in the `xp` kind and reduced with
  !! `mpi_sum` before being converted back to working precision.
  !! @param a,b,c,d Local vectors of length `n`.
  !! @param n Number of local entries.
  !! @return The global sum.
  function glsc4(a, b, c, d, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(in) :: a, b, c, d
    real(kind=rp) :: glsc4
    real(kind=xp) :: acc
    integer :: k, ierr

    ! Sequential accumulation keeps the summation order fixed.
    acc = 0.0_xp
    do k = 1, n
       acc = acc + a(k) * b(k) * c(k) * d(k)
    end do

    call mpi_allreduce(mpi_in_place, acc, 1, &
         mpi_extra_precision, mpi_sum, neko_comm, ierr)
    glsc4 = acc
  end function glsc4


  !> In-place heap sort of a real vector into ascending order.
  !! @param a Vector of length `n`; sorted in place.
  !! @param ind On return, `ind(k)` is the original position of the value
  !! now stored in `a(k)`.
  !! @param n Number of entries. For `n <= 1` only `ind` is initialised.
  subroutine sortrp(a, ind, n)

    integer, intent(in) :: n

    real(kind=rp), intent(inout) :: a(n)

    integer, intent(out) :: ind(n)

    real(kind=rp) :: aa

    integer :: j, ir, i, ii, l


    ! Start from the identity permutation.
    do j = 1, n

       ind(j) = j

    end do


    if (n .le. 1) return


    ! l counts down through the heap-building phase; ir is the last index
    ! of the part of the array that is still a heap.
    l = n/2+1

    ir = n

    do while (.true.)

       if (l .gt. 1) then

          ! Heap-building phase: sift down the next parent node.
          l = l-1

          aa = a(l)

          ii = ind(l)

       else

          ! Extraction phase: move the current maximum a(1) to position ir
          ! and re-insert the value that was stored there.
          aa = a(ir)

          ii = ind(ir)

          a(ir) = a(1)

          ind(ir) = ind(1)

          ir = ir - 1

          if (ir .eq. 1) then

             ! Only one element left in the heap: place it and finish.
             a(1) = aa

             ind(1) = ii

             return

          end if

       end if

       ! Sift (aa, ii) down from node i; j is the child being examined.
       i = l

       j = l+l

       do while (j .le. ir)

          if (j .lt. ir) then

             ! Select the larger of the two children.
             if ( a(j) .lt. a(j+1) ) j = j + 1

          end if

          if (aa .lt. a(j)) then

             ! Promote the child and continue one level further down.
             a(i) = a(j)

             ind(i) = ind(j)

             i = j

             j = j+j

          else

             ! Correct slot found: force the inner loop to terminate.
             j = ir+1

          end if

       end do

       a(i) = aa

       ind(i) = ii

    end do

  subroutine sortrp(a, ind, n) …

  end subroutine sortrp


  !> In-place heap sort of an `integer(i4)` vector into ascending order.
  !! @param a Vector of length `n`; sorted in place.
  !! @param ind On return, `ind(k)` is the original position of the value
  !! now stored in `a(k)`.
  !! @param n Number of entries. For `n <= 1` only `ind` is initialised.
  subroutine sorti4(a, ind, n)

    integer, intent(in) :: n

    integer(i4), intent(inout) :: a(n)

    integer, intent(out) :: ind(n)

    integer(i4) :: aa

    integer :: j, ir, i, ii, l


    ! Start from the identity permutation.
    do j = 1, n

       ind(j) = j

    end do


    if (n .le. 1) return


    ! l counts down through the heap-building phase; ir is the last index
    ! of the part of the array that is still a heap.
    l = n/2+1

    ir = n

    do while (.true.)

       if (l .gt. 1) then

          ! Heap-building phase: sift down the next parent node.
          l = l - 1

          aa = a(l)

          ii = ind(l)

       else

          ! Extraction phase: move the current maximum a(1) to position ir
          ! and re-insert the value that was stored there.
          aa = a(ir)

          ii = ind(ir)

          a(ir) = a( 1)

          ind(ir) = ind( 1)

          ir = ir - 1

          if (ir .eq. 1) then

             ! Only one element left in the heap: place it and finish.
             a(1) = aa

             ind(1) = ii

             return

          end if

       end if

       ! Sift (aa, ii) down from node i; j is the child being examined.
       i = l

       j = l + l

       do while (j .le. ir)

          if (j .lt. ir) then

             ! Select the larger of the two children.
             if ( a(j) .lt. a(j + 1) ) j = j + 1

          end if

          if (aa .lt. a(j)) then

             ! Promote the child and continue one level further down.
             a(i) = a(j)

             ind(i) = ind(j)

             i = j

             j = j + j

          else

             ! Correct slot found: force the inner loop to terminate.
             j = ir + 1

          end if

       end do

       a(i) = aa

       ind(i) = ii

    end do

  subroutine sorti4(a, ind, n) …

  end subroutine sorti4


  !> Permute a real vector in place by gathering, `b(i) = b_old(ind(i))`.
  !! @param b Vector of length `n`, permuted in place.
  !! @param ind Source index for each destination entry.
  !! @param n Number of entries.
  subroutine swapdp(b, ind, n)
    integer, intent(in) :: n
    real(kind=rp), intent(inout) :: b(n)
    integer, intent(in) :: ind(n)
    real(kind=rp) :: temp(n)

    ! Snapshot the input so the gather reads only original values.
    temp = b
    b = temp(ind)
  end subroutine swapdp


  !> Permute an `integer(i4)` vector in place by gathering,
  !! `b(i) = b_old(ind(i))`.
  !! @param b Vector of length `n`, permuted in place.
  !! @param ind Source index for each destination entry.
  !! @param n Number of entries.
  subroutine swapi4(b, ind, n)
    integer, intent(in) :: n
    integer(i4), intent(inout) :: b(n)
    integer, intent(in) :: ind(n)
    integer(i4) :: temp(n)

    ! Snapshot the input so the gather reads only original values.
    temp = b
    b = temp(ind)
  end subroutine swapi4


  !> Permute a real vector in place by scattering, `b(ind(i)) = b_old(i)`.
  !! @param b Vector of length `n`, permuted in place.
  !! @param ind Destination index for each source entry.
  !! @param n Number of entries.
  subroutine reorddp(b, ind, n)
    integer, intent(in) :: n
    real(kind=rp), intent(inout) :: b(n)
    integer, intent(in) :: ind(n)
    real(kind=rp) :: temp(n)
    integer :: k

    ! Snapshot the input so the scatter reads only original values.
    temp = b
    ! An explicit loop keeps the scatter well defined for any index list.
    do k = 1, n
       b(ind(k)) = temp(k)
    end do
  end subroutine reorddp


  !> Permute an `integer(i4)` vector in place by scattering,
  !! `b(ind(i)) = b_old(i)`.
  !! @param b Vector of length `n`, permuted in place.
  !! @param ind Destination index for each source entry.
  !! @param n Number of entries.
  subroutine reordi4(b, ind, n)
    integer, intent(in) :: n
    integer(i4), intent(inout) :: b(n)
    integer, intent(in) :: ind(n)
    integer(i4) :: temp(n)
    integer :: k

    ! Snapshot the input so the scatter reads only original values.
    temp = b
    ! An explicit loop keeps the scatter well defined for any index list.
    do k = 1, n
       b(ind(k)) = temp(k)
    end do
  end subroutine reordi4


  !> Reverse the order of a real vector and of its index array, in place.
  !! @param b Vector of length `n`; on return `b(i) = b_old(n+1-i)`.
  !! @param ind Index array of length `n`, reversed in the same way.
  !! @param n Number of entries.
  subroutine flipvdp(b, ind, n)
    integer, intent(in) :: n
    real(kind=rp), intent(inout) :: b(n)
    integer, intent(inout) :: ind(n)
    real(kind=rp) :: temp(n)
    integer :: tempind(n)

    ! Build the reversed copies first, then write them back.
    temp = b(n:1:-1)
    tempind = ind(n:1:-1)
    b = temp
    ind = tempind
  end subroutine flipvdp


  !> Reverse the order of an `integer(i4)` vector and of its index array,
  !! in place.
  !! @param b Vector of length `n`; on return `b(i) = b_old(n+1-i)`.
  !! @param ind Index array of length `n`, reversed in the same way.
  !! @param n Number of entries.
  subroutine flipvi4(b, ind, n)
    integer, intent(in) :: n
    integer(i4), intent(inout) :: b(n)
    integer, intent(inout) :: ind(n)
    integer(i4) :: temp(n)
    integer :: tempind(n)

    ! Build the reversed copies first, then write them back.
    temp = b(n:1:-1)
    tempind = ind(n:1:-1)
    b = temp
    ind = tempind
  end subroutine flipvi4


  !> Replace every entry of a vector by its absolute value, `a = |a|`.
  !! @param a Vector of length `n`, updated in place.
  !! @param n Number of entries.
  subroutine absval(a, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a

    a = abs(a)
  end subroutine absval


  ! ========================================================================== !

  ! Point-wise operations


  !> Point-wise maximum of two vectors, in place: `a = max(a, b)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n`.
  !! @param n Number of entries.
  subroutine pwmax_vec2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = max(a, b)
  end subroutine pwmax_vec2


  !> Point-wise maximum of two vectors into a third: `a = max(b, c)`.
  !! @param a Result vector of length `n`.
  !! @param b,c Operand vectors of length `n`.
  !! @param n Number of entries.
  subroutine pwmax_vec3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = max(b, c)
  end subroutine pwmax_vec3


  !> Point-wise maximum of a vector and a scalar, in place:
  !! `a = max(a, b)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Scalar lower bound applied to every entry.
  !! @param n Number of entries.
  subroutine pwmax_scal2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), intent(in) :: b

    a = max(a, b)
  end subroutine pwmax_scal2


  !> Point-wise maximum of a vector and a scalar into a separate result:
  !! `a = max(b, c)`.
  !! @param a Result vector of length `n`.
  !! @param b Input vector of length `n`.
  !! @param c Scalar lower bound applied to every entry.
  !! @param n Number of entries.
  subroutine pwmax_scal3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c

    a = max(b, c)
  end subroutine pwmax_scal3


  !> Point-wise minimum of two vectors, in place: `a = min(a, b)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Vector of length `n`.
  !! @param n Number of entries.
  subroutine pwmin_vec2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b

    a = min(a, b)
  end subroutine pwmin_vec2


  !> Point-wise minimum of two vectors into a third: `a = min(b, c)`.
  !! @param a Result vector of length `n`.
  !! @param b,c Operand vectors of length `n`.
  !! @param n Number of entries.
  subroutine pwmin_vec3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b, c

    a = min(b, c)
  end subroutine pwmin_vec3


  !> Point-wise minimum of a vector and a scalar, in place:
  !! `a = min(a, b)`.
  !! @param a Vector of length `n`, updated in place.
  !! @param b Scalar upper bound applied to every entry.
  !! @param n Number of entries.
  subroutine pwmin_sca2(a, b, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), intent(in) :: b

    a = min(a, b)
  end subroutine pwmin_sca2


  !> Point-wise minimum of a vector and a scalar into a separate result:
  !! `a = min(b, c)`.
  !! @param a Result vector of length `n`.
  !! @param b Input vector of length `n`.
  !! @param c Scalar upper bound applied to every entry.
  !! @param n Number of entries.
  subroutine pwmin_sca3(a, b, c, n)
    integer, intent(in) :: n
    real(kind=rp), dimension(n), intent(inout) :: a
    real(kind=rp), dimension(n), intent(in) :: b
    real(kind=rp), intent(in) :: c

    a = min(b, c)
  end subroutine pwmin_sca3


end module math

real
double real
Definition device_config.h:12

math::abscmp
Definition math.f90:78

math::flipv
Definition math.f90:94

math::pwmax
Definition math.f90:102

math::pwmin
Definition math.f90:106

math::relcmp
Definition math.f90:98

math::reord
Definition math.f90:90

math::sort
Definition math.f90:82

math::swap
Definition math.f90:86

utils::neko_error
Definition utils.f90:42

comm
Definition comm.F90:1

comm::neko_comm
type(mpi_comm) neko_comm
MPI communicator.
Definition comm.F90:16

comm::mpi_real_precision
type(mpi_datatype) mpi_real_precision
MPI type for working precision of REAL types.
Definition comm.F90:23

comm::mpi_extra_precision
type(mpi_datatype) mpi_extra_precision
Definition comm.F90:24

math
Definition math.f90:60

math::cmult
subroutine, public cmult(a, c, n)
Multiplication by constant c .
Definition math.f90:311

math::cmult2
subroutine, public cmult2(a, b, c, n)
Multiplication by constant c .
Definition math.f90:701

math::row_zero
subroutine, public row_zero(a, m, n, e)
Sets row e to 0 in matrix a.
Definition math.f90:217

math::invcol2
subroutine, public invcol2(a, b, n)
Vector division .
Definition math.f90:715

math::vlsc2
real(kind=rp) function, public vlsc2(u, v, n)
Compute multiplication sum .
Definition math.f90:573

math::pwmin_sca3
subroutine pwmin_sca3(a, b, c, n)
Point-wise minimum of scalar and vector, $a_i = \min(b_i, c)$.
Definition math.f90:1277

math::pi
real(kind=rp), parameter, public pi
Definition math.f90:76

math::pwmax_scal2
subroutine pwmax_scal2(a, b, n)
Point-wise maximum of scalar and vector, $a_i = \max(a_i, b)$.
Definition math.f90:1216

math::glsc3
real(kind=rp) function, public glsc3(a, b, c, n)
Weighted inner product .
Definition math.f90:895

math::qabscmp
pure logical function qabscmp(x, y)
Return quad precision absolute comparison.
Definition math.f90:142

math::ascol5
subroutine, public ascol5(a, b, c, d, e, n)
Returns .
Definition math.f90:830

math::invers2
subroutine, public invers2(a, b, n)
Compute inverted vector .
Definition math.f90:500

math::cadd2
subroutine, public cadd2(a, b, s, n)
Add a scalar to vector .
Definition math.f90:335

math::pwmin_sca2
subroutine pwmin_sca2(a, b, n)
Point-wise minimum of scalar and vector, $a_i = \min(a_i, b)$.
Definition math.f90:1265

math::cadd
subroutine, public cadd(a, s, n)
Add a scalar to vector .
Definition math.f90:323

math::reorddp
subroutine reorddp(b, ind, n)
reorder double precision array - inverse of swap
Definition math.f90:1094

math::addsqr2s2
subroutine, public addsqr2s2(a, b, c1, n)
Returns .
Definition math.f90:687

math::glsc4
real(kind=rp) function, public glsc4(a, b, c, d, n)
Definition math.f90:914

math::masked_red_copy
subroutine, public masked_red_copy(a, b, mask, n, m)
Copy a masked vector to a reduced contiguous vector.
Definition math.f90:280

math::pwmax_vec3
subroutine pwmax_vec3(a, b, c, n)
Point-wise maximum of two vectors .
Definition math.f90:1204

math::swapdp
subroutine swapdp(b, ind, n)
sort double precision array according to ind vector
Definition math.f90:1054

math::flipvi4
subroutine flipvi4(b, ind, n)
Flip single integer vector b and ind.
Definition math.f90:1157

math::add2s1
subroutine, public add2s1(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on first argument)
Definition math.f90:658

math::glsc2
real(kind=rp) function, public glsc2(a, b, n)
Weighted inner product .
Definition math.f90:876

math::subcol3
subroutine, public subcol3(a, b, c, n)
Returns .
Definition math.f90:756

math::rone
subroutine, public rone(a, n)
Set all elements to one.
Definition math.f90:228

math::flipvdp
subroutine flipvdp(b, ind, n)
Flip double precision vector b and ind.
Definition math.f90:1134

math::x_update
subroutine, public x_update(a, b, c, c1, c2, n)
Returns .
Definition math.f90:861

math::add3
subroutine, public add3(a, b, c, n)
Vector addition .
Definition math.f90:600

math::swapi4
subroutine swapi4(b, ind, n)
sort single integer array according to ind vector
Definition math.f90:1074

math::glimin
integer function, public glimin(a, n)
Min of an integer vector of length n.
Definition math.f90:422

math::glsum
real(kind=rp) function, public glsum(a, n)
Sum a vector of length n.
Definition math.f90:360

math::sub3
subroutine, public sub3(a, b, c, n)
Vector subtraction .
Definition math.f90:642

math::addcol4
subroutine, public addcol4(a, b, c, d, n)
Returns .
Definition math.f90:815

math::add2
subroutine, public add2(a, b, n)
Vector addition .
Definition math.f90:587

math::cfill
subroutine, public cfill(a, c, n)
Set all elements to a constant c .
Definition math.f90:348

math::absval
subroutine, public absval(a, n)
Take the absolute value of an array.
Definition math.f90:1179

math::invcol3
subroutine, public invcol3(a, b, c, n)
Invert a vector .
Definition math.f90:487

math::sabscmp
pure logical function sabscmp(x, y)
Return single precision absolute comparison .
Definition math.f90:122

math::add3s2
subroutine, public add3s2(a, b, c, c1, c2, n)
Returns .
Definition math.f90:770

math::subcol4
subroutine, public subcol4(a, b, c, d, n)
Returns .
Definition math.f90:786

math::sorti4
subroutine sorti4(a, ind, n)
Heap Sort for single integer arrays.
Definition math.f90:998

math::addcol3
subroutine, public addcol3(a, b, c, n)
Returns .
Definition math.f90:801

math::dabscmp
pure logical function dabscmp(x, y)
Return double precision absolute comparison .
Definition math.f90:132

math::invcol1
subroutine, public invcol1(a, n)
Invert a vector .
Definition math.f90:475

math::masked_copy
subroutine, public masked_copy(a, b, mask, n, m)
Copy a masked vector .
Definition math.f90:258

math::neko_m_ln2
real(kind=rp), parameter, public neko_m_ln2
Definition math.f90:73

math::chsign
subroutine, public chsign(a, n)
Change sign of vector .
Definition math.f90:440

math::col2
subroutine, public col2(a, b, n)
Vector multiplication .
Definition math.f90:729

math::izero
subroutine, public izero(a, n)
Zero an integer vector.
Definition math.f90:206

math::glmax
real(kind=rp) function, public glmax(a, n)
Max of a vector of length n.
Definition math.f90:377

math::copy
subroutine, public copy(a, b, n)
Copy a vector .
Definition math.f90:239

math::pwmax_scal3
subroutine pwmax_scal3(a, b, c, n)
Point-wise maximum of scalar and vector, $a_i = \max(b_i, c)$.
Definition math.f90:1228

math::add4
subroutine, public add4(a, b, c, d, n)
Vector addition .
Definition math.f90:614

math::col3
subroutine, public col3(a, b, c, n)
Vector multiplication with 3 vectors .
Definition math.f90:742

math::pwmin_vec2
subroutine pwmin_vec2(a, b, n)
Point-wise minimum of two vectors, $a_i = \min(a_i, b_i)$.
Definition math.f90:1241

math::pwmin_vec3
subroutine pwmin_vec3(a, b, c, n)
Point-wise minimum of two vectors, $a_i = \min(b_i, c_i)$.
Definition math.f90:1253

math::pwmax_vec2
subroutine pwmax_vec2(a, b, n)
Point-wise maximum of two vectors .
Definition math.f90:1192

math::drelcmp
pure logical function drelcmp(x, y, eps)
Return double precision relative comparison .
Definition math.f90:166

math::neko_eps
real(kind=rp), parameter, public neko_eps
Machine epsilon .
Definition math.f90:70

math::vdot3
subroutine, public vdot3(dot, u1, u2, u3, v1, v2, v3, n)
Compute a dot product  (3-d version) assuming vector components  etc.
Definition math.f90:545

math::qrelcmp
pure logical function qrelcmp(x, y, eps)
Return quad precision relative comparison .
Definition math.f90:181

math::rzero
subroutine, public rzero(a, n)
Zero a real vector.
Definition math.f90:195

math::vdot2
subroutine, public vdot2(dot, u1, u2, v1, v2, n)
Compute a dot product  (2-d version) assuming vector components  etc.
Definition math.f90:531

math::vlmin
real(kind=rp) function, public vlmin(vec, n)
minimum value of a vector of length n
Definition math.f90:463

math::vlmax
real(kind=rp) function, public vlmax(vec, n)
maximum value of a vector of length n
Definition math.f90:452

math::glimax
integer function, public glimax(a, n)
Max of an integer vector of length n.
Definition math.f90:392

math::sortrp
subroutine sortrp(a, ind, n)
Heap Sort for double precision arrays.
Definition math.f90:940

math::sub2
subroutine, public sub2(a, b, n)
Vector subtraction.
Definition math.f90:629

math::cfill_mask
subroutine, public cfill_mask(a, c, size, mask, mask_size)
Fill a constant to a masked vector.
Definition math.f90:297

math::add2s2
subroutine, public add2s2(a, b, c1, n)
Vector addition with scalar multiplication  (multiplication on second argument)
Definition math.f90:673

math::glmin
real(kind=rp) function, public glmin(a, n)
Min of a vector of length n.
Definition math.f90:407

math::vcross
subroutine, public vcross(u1, u2, u3, v1, v2, v3, w1, w2, w3, n)
Compute a cross product  assuming vector components  etc.
Definition math.f90:514

math::srelcmp
pure logical function srelcmp(x, y, eps)
Return single precision relative comparison .
Definition math.f90:152

math::vlsc3
real(kind=rp) function, public vlsc3(u, v, w, n)
Compute multiplication sum .
Definition math.f90:559

math::reordi4
subroutine reordi4(b, ind, n)
reorder single integer array - inverse of swap
Definition math.f90:1114

math::p_update
subroutine, public p_update(a, b, c, c1, c2, n)
Returns .
Definition math.f90:846

num_types
Definition num_types.f90:1

num_types::qp
integer, parameter, public qp
Definition num_types.f90:10

num_types::i4
integer, parameter, public i4
Definition num_types.f90:6

num_types::xp
integer, parameter, public xp
Definition num_types.f90:14

num_types::dp
integer, parameter, public dp
Definition num_types.f90:9

num_types::sp
integer, parameter, public sp
Definition num_types.f90:8

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

utils
Utilities.
Definition utils.f90:35

max
#define max(a, b)
Definition tensor.cu:40