dd/dbf/operators_8f90_source.html

! Copyright (c) 2020-2024, The Neko Authors

! All rights reserved.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

!   * Redistributions of source code must retain the above copyright

!     notice, this list of conditions and the following disclaimer.

!

!   * Redistributions in binary form must reproduce the above

!     copyright notice, this list of conditions and the following

!     disclaimer in the documentation and/or other materials provided

!     with the distribution.

!

!   * Neither the name of the authors nor the names of its

!     contributors may be used to endorse or promote products derived

!     from this software without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

! POSSIBILITY OF SUCH DAMAGE.

!

module operators

  use neko_config, only : neko_bcknd_sx, neko_bcknd_device, neko_bcknd_xsmm, &

                          neko_device_mpi

  use num_types, only : rp

  use opr_cpu, only : opr_cpu_cfl, opr_cpu_curl, opr_cpu_opgrad, &

                      opr_cpu_conv1, opr_cpu_convect_scalar, opr_cpu_cdtp, &

                      opr_cpu_dudxyz, opr_cpu_lambda2, opr_cpu_set_convect_rst

  use opr_sx, only : opr_sx_cfl, opr_sx_curl, opr_sx_opgrad, &

                     opr_sx_conv1, opr_sx_convect_scalar, opr_sx_cdtp, &

                     opr_sx_dudxyz, opr_sx_lambda2, opr_sx_set_convect_rst

  use opr_xsmm, only : opr_xsmm_cdtp, opr_xsmm_conv1, opr_xsmm_curl, &

                       opr_xsmm_dudxyz, opr_xsmm_opgrad, &

                       opr_xsmm_convect_scalar, opr_xsmm_set_convect_rst

  use opr_device, only : opr_device_cdtp, opr_device_cfl, opr_device_curl, &

                         opr_device_conv1, opr_device_dudxyz, &

                         opr_device_lambda2, opr_device_opgrad

  use space, only : space_t

  use coefs, only : coef_t

  use field, only : field_t

  use interpolation, only : interpolator_t

  use math, only : glsum, cmult, add2, add3s2, cadd, copy, col2, invcol2, &

                   invcol3, rzero

  use device, only : c_ptr, device_get_ptr

  use device_math, only : device_add2, device_cmult, device_copy

  use scratch_registry, only : neko_scratch_registry

  use comm

  implicit none

  private


  public :: dudxyz, opgrad, ortho, cdtp, conv1, curl, cfl, &

            lambda2op, strain_rate, div, grad, set_convect_rst, runge_kutta


contains


  !> Compute the derivative of a scalar field along a single direction.
  !! The call is forwarded to the first enabled backend, checked in the
  !! order SX, libxsmm, device; the CPU implementation is the fallback.
  !! @param du Receives the derivative computed by the backend.
  !! @param u The scalar field to differentiate.
  !! @param dr First metric array handed to the backend (callers in this
  !! module pass e.g. `coef%drdx`).
  !! @param ds Second metric array (e.g. `coef%dsdx`).
  !! @param dt Third metric array (e.g. `coef%dtdx`).
  !! @param coef The SEM coefficients; they also fix the array extents.
  subroutine dudxyz (du, u, dr, ds, dt, coef)
    type(coef_t), intent(in), target :: coef
    real(kind=rp), intent(inout) :: &
         du(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)
    real(kind=rp), intent(in) :: &
         u(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv), &
         dr(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv), &
         ds(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv), &
         dt(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)

    ! SX-Aurora backend takes precedence when enabled.
    if (neko_bcknd_sx == 1) then
       call opr_sx_dudxyz(du, u, dr, ds, dt, coef)
       return
    end if

    ! libxsmm backend.
    if (neko_bcknd_xsmm == 1) then
       call opr_xsmm_dudxyz(du, u, dr, ds, dt, coef)
       return
    end if

    ! Accelerator backend.
    if (neko_bcknd_device == 1) then
       call opr_device_dudxyz(du, u, dr, ds, dt, coef)
       return
    end if

    ! Plain CPU fallback.
    call opr_cpu_dudxyz(du, u, dr, ds, dt, coef)

  end subroutine dudxyz


  !> Compute the divergence of a vector field.
  !! The three directional derivatives are evaluated with `dudxyz` and
  !! summed into `res`, using one field borrowed from the scratch registry.
  !! @param res Receives d(ux)/dx + d(uy)/dy + d(uz)/dz.
  !! @param ux The x component of the vector field.
  !! @param uy The y component of the vector field.
  !! @param uz The z component of the vector field.
  !! @param coef The SEM coefficients.
  subroutine div(res, ux, uy, uz, coef)
    type(coef_t), intent(in), target :: coef
    real(kind=rp), intent(inout) :: &
         res(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)
    real(kind=rp), intent(in) :: &
         ux(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv), &
         uy(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv), &
         uz(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)
    type(field_t), pointer :: tmp
    integer :: tmp_idx
    type(c_ptr) :: res_d

    ! The device pointer is only looked up (and only used) on device builds.
    if (neko_bcknd_device == 1) res_d = device_get_ptr(res)

    call neko_scratch_registry%request_field(tmp, tmp_idx)

    ! res = dux / dx
    call dudxyz(res, ux, coef%drdx, coef%dsdx, coef%dtdx, coef)

    ! res = res + duy / dy
    call dudxyz(tmp%x, uy, coef%drdy, coef%dsdy, coef%dtdy, coef)
    call accumulate_tmp()

    ! res = res + duz / dz
    call dudxyz(tmp%x, uz, coef%drdz, coef%dsdz, coef%dtdz, coef)
    call accumulate_tmp()

    call neko_scratch_registry%relinquish_field(tmp_idx)

  contains

    !> Add the scratch field to `res` on the active backend.
    subroutine accumulate_tmp()
      if (neko_bcknd_device == 1) then
         call device_add2(res_d, tmp%x_d, tmp%size())
      else
         call add2(res, tmp%x, tmp%size())
      end if
    end subroutine accumulate_tmp

  end subroutine div


  !> Compute the gradient of a scalar field.
  !! Each component is obtained by one `dudxyz` call with the metric
  !! arrays of the corresponding direction.
  !! @param ux Receives the x component of the gradient.
  !! @param uy Receives the y component of the gradient.
  !! @param uz Receives the z component of the gradient.
  !! @param u The scalar field.
  !! @param coef The SEM coefficients.
  subroutine grad(ux, uy, uz, u, coef)
    type(coef_t), intent(in) :: coef
    real(kind=rp), intent(inout) :: ux(coef%Xh%lxyz, coef%msh%nelv), &
                                    uy(coef%Xh%lxyz, coef%msh%nelv), &
                                    uz(coef%Xh%lxyz, coef%msh%nelv)
    real(kind=rp), intent(in) :: u(coef%Xh%lxyz, coef%msh%nelv)

    ! d/dx
    call dudxyz(ux, u, coef%drdx, coef%dsdx, coef%dtdx, coef)
    ! d/dy
    call dudxyz(uy, u, coef%drdy, coef%dsdy, coef%dtdy, coef)
    ! d/dz
    call dudxyz(uz, u, coef%drdz, coef%dsdz, coef%dtdz, coef)

  end subroutine grad


  !> Compute the weak gradient of a scalar field, i.e. the gradient
  !! multiplied by the mass matrix.
  !! @param ux Receives the x component.
  !! @param uy Receives the y component.
  !! @param uz Receives the z component.
  !! @param u The scalar field.
  !! @param coef The SEM coefficients.
  !! @param es Optional start index of the element block; defaults to 1.
  !! @param ee Optional end index of the element block; defaults to
  !! `coef%msh%nelv`.
  !! @note Only the CPU backend call receives the element range; the SX,
  !! libxsmm and device calls made here do not take it.
  subroutine opgrad(ux, uy, uz, u, coef, es, ee)
    type(coef_t), intent(in) :: coef
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: ux
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uy
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uz
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: u
    integer, intent(in), optional :: es, ee
    integer :: eblk_start, eblk_end

    ! Start from the full element range, then narrow it if requested.
    eblk_start = 1
    if (present(es)) eblk_start = es

    eblk_end = coef%msh%nelv
    if (present(ee)) eblk_end = ee

    if (neko_bcknd_sx .eq. 1) then
       call opr_sx_opgrad(ux, uy, uz, u, coef)
    else if (neko_bcknd_xsmm .eq. 1) then
       call opr_xsmm_opgrad(ux, uy, uz, u, coef)
    else if (neko_bcknd_device .eq. 1) then
       call opr_device_opgrad(ux, uy, uz, u, coef)
    else
       call opr_cpu_opgrad(ux, uy, uz, u, coef, eblk_start, eblk_end)
    end if

  end subroutine opgrad


  !> Orthogonalize with regard to the vector (1,1,1,...,1)^T.
  !! The sum returned by `glsum` is divided by `glb_n` and the resulting
  !! value is subtracted from every entry of `x`.
  !! @param x The vector to orthogonalize, modified in place.
  !! @param n Number of entries of `x` handled by this call.
  !! @param glb_n Divisor for the sum; presumably the global number of
  !! entries across all ranks (confirm against callers).
  subroutine ortho(x, n, glb_n)
    integer, intent(in) :: n
    integer, intent(in) :: glb_n
    real(kind=rp), intent(inout) :: x(n)
    real(kind=rp) :: mean_shift

    ! Negated mean, so that a plain scalar add removes it from x.
    mean_shift = -(glsum(x, n)/glb_n)
    call cadd(x, mean_shift, n)

  end subroutine ortho


  !> Apply D^T to a scalar field, where D is the derivative matrix.
  !! @param dtx Receives the result.
  !! @param x The scalar field; declared `intent(inout)` because it is
  !! forwarded as such to the backends.
  !! @param dr First metric array handed to the backend.
  !! @param ds Second metric array handed to the backend.
  !! @param dt Third metric array handed to the backend.
  !! @param coef The SEM coefficients.
  !! @param es Optional start index of the element block; defaults to 1.
  !! @param ee Optional end index of the element block; defaults to
  !! `coef%msh%nelv`.
  !! @note Only the CPU backend call receives the element range; the SX,
  !! libxsmm and device calls made here do not take it.
  subroutine cdtp (dtx, x, dr, ds, dt, coef, es, ee)
    type(coef_t), intent(in) :: coef
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: dtx
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: x
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: dr
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: ds
    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: dt
    integer, intent(in), optional :: es, ee
    integer :: eblk_start, eblk_end

    ! Start from the full element range, then narrow it if requested.
    eblk_start = 1
    if (present(es)) eblk_start = es

    eblk_end = coef%msh%nelv
    if (present(ee)) eblk_end = ee

    if (neko_bcknd_sx .eq. 1) then
       call opr_sx_cdtp(dtx, x, dr, ds, dt, coef)
    else if (neko_bcknd_xsmm .eq. 1) then
       call opr_xsmm_cdtp(dtx, x, dr, ds, dt, coef)
    else if (neko_bcknd_device .eq. 1) then
       call opr_device_cdtp(dtx, x, dr, ds, dt, coef)
    else
       call opr_cpu_cdtp(dtx, x, dr, ds, dt, coef, eblk_start, eblk_end)
    end if

  end subroutine cdtp


  !> Compute the advection term.
  !! @param du Receives the result.
  !! @param u The advected field.
  !! @param vx The x component of the advecting velocity.
  !! @param vy The y component of the advecting velocity.
  !! @param vz The z component of the advecting velocity.
  !! @param Xh The SEM function space.
  !! @param coef The SEM coefficients.
  !! @param es Optional start index of the element block; defaults to 1.
  !! @param ee Optional end index of the element block; defaults to
  !! `coef%msh%nelv`.
  !! @note Only the CPU backend call receives the element range; the SX,
  !! libxsmm and device calls are given `nelv` (and `gdim`) instead.
  subroutine conv1(du, u, vx, vy, vz, Xh, coef, es, ee)
    type(space_t), intent(inout) :: xh
    type(coef_t), intent(inout) :: coef
    real(kind=rp), intent(inout) :: du(xh%lxyz, coef%msh%nelv)
    real(kind=rp), intent(inout) :: u(xh%lx, xh%ly, xh%lz, coef%msh%nelv)
    real(kind=rp), intent(inout) :: vx(xh%lx, xh%ly, xh%lz, coef%msh%nelv)
    real(kind=rp), intent(inout) :: vy(xh%lx, xh%ly, xh%lz, coef%msh%nelv)
    real(kind=rp), intent(inout) :: vz(xh%lx, xh%ly, xh%lz, coef%msh%nelv)
    integer, intent(in), optional :: es, ee
    integer :: eblk_end, eblk_start

    associate(nelv => coef%msh%nelv, gdim => coef%msh%gdim)

      ! Start from the full element range, then narrow it if requested.
      eblk_start = 1
      if (present(es)) eblk_start = es

      eblk_end = nelv
      if (present(ee)) eblk_end = ee

      if (neko_bcknd_sx .eq. 1) then
         call opr_sx_conv1(du, u, vx, vy, vz, xh, coef, nelv)
      else if (neko_bcknd_xsmm .eq. 1) then
         call opr_xsmm_conv1(du, u, vx, vy, vz, xh, coef, nelv, gdim)
      else if (neko_bcknd_device .eq. 1) then
         call opr_device_conv1(du, u, vx, vy, vz, xh, coef, nelv, gdim)
      else
         call opr_cpu_conv1(du, u, vx, vy, vz, xh, coef, eblk_start, eblk_end)
      end if

    end associate

  end subroutine conv1


  !> Apply the convecting velocity c to the scalar field u, used in the
  !! OIFS scheme.
  !! @param du Receives the result; dimensioned on the GLL space.
  !! @param u The scalar field; dimensioned on the GL space.
  !! @param c The convecting velocity, three components on the GL space.
  !! @param Xh_GLL The GLL function space.
  !! @param Xh_GL The GL function space.
  !! @param coef_GLL The SEM coefficients for the GLL space.
  !! @param coef_GL The SEM coefficients for the GL space.
  !! @param GLL_to_GL The interpolator between the two spaces.
  !! @note There is no device branch here: any build that is neither SX
  !! nor libxsmm uses the CPU implementation.
  subroutine convect_scalar(du, u, c, Xh_GLL, Xh_GL, coef_GLL, &
                            coef_GL, GLL_to_GL)
    type(space_t), intent(in) :: xh_gl
    type(space_t), intent(in) :: xh_gll
    type(coef_t), intent(in) :: coef_GLL
    type(coef_t), intent(in) :: coef_GL
    type(interpolator_t), intent(inout) :: GLL_to_GL
    real(kind=rp), intent(inout) :: &
                   du(xh_gll%lx, xh_gll%ly, xh_gll%lz, coef_gl%msh%nelv)
    ! Extents follow (lx, ly, lz) like du; the earlier (lx, lx, lx) form
    ! only described the right size when all three extents were equal.
    real(kind=rp), intent(inout) :: &
                   u(xh_gl%lx, xh_gl%ly, xh_gl%lz, coef_gl%msh%nelv)
    real(kind=rp), intent(inout) :: c(xh_gl%lxyz, coef_gl%msh%nelv, 3)

    if (neko_bcknd_sx .eq. 1) then
       call opr_sx_convect_scalar(du, u, c, xh_gll, xh_gl, &
                                  coef_gll, coef_gl, gll_to_gl)
    else if (neko_bcknd_xsmm .eq. 1) then
       call opr_xsmm_convect_scalar(du, u, c, xh_gll, xh_gl, &
                                    coef_gll, coef_gl, gll_to_gl)
    else
       call opr_cpu_convect_scalar(du, u, c, xh_gll, xh_gl, &
                                   coef_gll, coef_gl, gll_to_gl)
    end if

  end subroutine convect_scalar


  !> Compute the curl of a vector field.
  !! The call is forwarded to the first enabled backend, checked in the
  !! order SX, libxsmm, device; the CPU implementation is the fallback.
  !! @param w1 Will store the x component of the curl.
  !! @param w2 Will store the y component of the curl.
  !! @param w3 Will store the z component of the curl.
  !! @param u1 The x component of the vector field.
  !! @param u2 The y component of the vector field.
  !! @param u3 The z component of the vector field.
  !! @param work1 A temporary array for computations.
  !! @param work2 A temporary array for computations.
  !! @param coef The SEM coefficients.
  subroutine curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
    type(field_t), intent(inout) :: w1
    type(field_t), intent(inout) :: w2
    type(field_t), intent(inout) :: w3
    type(field_t), intent(inout) :: u1
    type(field_t), intent(inout) :: u2
    type(field_t), intent(inout) :: u3
    type(field_t), intent(inout) :: work1
    type(field_t), intent(inout) :: work2
    type(coef_t), intent(in) :: coef

    if (neko_bcknd_sx .eq. 1) then
       call opr_sx_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
    else if (neko_bcknd_xsmm .eq. 1) then
       call opr_xsmm_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
    else if (neko_bcknd_device .eq. 1) then
       call opr_device_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
    else
       call opr_cpu_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
    end if

  end subroutine curl


  !> Compute the CFL number.
  !! The backend value is computed first (SX, then device, otherwise CPU;
  !! there is no libxsmm branch). Unless `neko_device_mpi` is set, the
  !! maximum over all ranks of `neko_comm` is then taken in place.
  !! @param dt The timestep.
  !! @param u The x component of velocity.
  !! @param v The y component of velocity.
  !! @param w The z component of velocity.
  !! @param Xh The SEM function space.
  !! @param coef The SEM coefficients.
  !! @param nelv The total number of elements.
  !! @param gdim Number of geometric dimensions.
  !! @return The CFL number.
  function cfl(dt, u, v, w, Xh, coef, nelv, gdim)
    type(space_t), intent(in) :: xh
    type(coef_t), intent(in) :: coef
    integer, intent(in) :: nelv, gdim
    real(kind=rp), intent(in) :: dt
    real(kind=rp), dimension(Xh%lx, Xh%ly, Xh%lz, nelv), intent(in) :: u, v, w
    real(kind=rp) :: cfl
    integer :: ierr

    if (neko_bcknd_sx .eq. 1) then
       ! The SX backend call does not take gdim.
       cfl = opr_sx_cfl(dt, u, v, w, xh, coef, nelv)
    else if (neko_bcknd_device .eq. 1) then
       cfl = opr_device_cfl(dt, u, v, w, xh, coef, nelv, gdim)
    else
       cfl = opr_cpu_cfl(dt, u, v, w, xh, coef, nelv, gdim)
    end if

    ! NOTE(review): with device-aware MPI the reduction is skipped here;
    ! presumably the device backend already reduces across ranks - confirm.
    if (.not. neko_device_mpi) then
       call mpi_allreduce(mpi_in_place, cfl, 1, &
            mpi_real_precision, mpi_max, neko_comm, ierr)
    end if

  end function cfl


  !> Compute the strain rate tensor, i.e. 0.5 * (du_i/dx_j + du_j/dx_i).
  !! The off-diagonal terms are assembled first, using `s11` as scratch
  !! storage for the second derivative of each pair; the diagonal terms
  !! are written last so that `s11` ends up holding its final value.
  !! @param s11 Receives du/dx (also used as scratch while assembling the
  !! off-diagonal terms).
  !! @param s22 Receives dv/dy.
  !! @param s33 Receives dw/dz.
  !! @param s12 Receives 0.5 * (du/dy + dv/dx).
  !! @param s13 Receives 0.5 * (du/dz + dw/dx).
  !! @param s23 Receives 0.5 * (dv/dz + dw/dy).
  !! @param u The first field (differentiated as the x velocity component).
  !! @param v The second field (differentiated as the y velocity component).
  !! @param w The third field (differentiated as the z velocity component).
  !! @param coef The SEM coefficients.
  subroutine strain_rate(s11, s22, s33, s12, s13, s23, u, v, w, coef)
    type(field_t), intent(in) :: u, v, w
    type(coef_t), intent(in) :: coef
    real(kind=rp), intent(inout) :: s11(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)
    real(kind=rp), intent(inout) :: s22(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)
    real(kind=rp), intent(inout) :: s33(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)
    real(kind=rp), intent(inout) :: s12(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)
    real(kind=rp), intent(inout) :: s13(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)
    real(kind=rp), intent(inout) :: s23(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv)

    type(c_ptr) :: s11_d, s22_d, s33_d, s12_d, s23_d, s13_d
    integer :: n_pts
    logical :: on_device

    on_device = (neko_bcknd_device == 1)

    ! Device pointers are only looked up on device builds.
    if (on_device) then
       s11_d = device_get_ptr(s11)
       s22_d = device_get_ptr(s22)
       s33_d = device_get_ptr(s33)
       s12_d = device_get_ptr(s12)
       s23_d = device_get_ptr(s23)
       s13_d = device_get_ptr(s13)
    end if

    ! Total number of points: elements times points per element.
    n_pts = u%msh%nelv * u%Xh%lxyz

    ! s12 = du/dy + dv/dx (s11 is the work array)
    call dudxyz (s12, u%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
    call dudxyz (s11, v%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
    if (on_device) then
       call device_add2(s12_d, s11_d, n_pts)
    else
       call add2(s12, s11, n_pts)
    end if

    ! s13 = du/dz + dw/dx
    call dudxyz (s13, u%x, coef%drdz, coef%dsdz, coef%dtdz, coef)
    call dudxyz (s11, w%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
    if (on_device) then
       call device_add2(s13_d, s11_d, n_pts)
    else
       call add2(s13, s11, n_pts)
    end if

    ! s23 = dv/dz + dw/dy
    call dudxyz (s23, v%x, coef%drdz, coef%dsdz, coef%dtdz, coef)
    call dudxyz (s11, w%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
    if (on_device) then
       call device_add2(s23_d, s11_d, n_pts)
    else
       call add2(s23, s11, n_pts)
    end if

    ! Diagonal terms; s11 is no longer needed as scratch from here on.
    call dudxyz (s11, u%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
    call dudxyz (s22, v%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
    call dudxyz (s33, w%x, coef%drdz, coef%dsdz, coef%dtdz, coef)

    ! Halve the symmetric sums to obtain the off-diagonal strain rates.
    if (on_device) then
       call device_cmult(s12_d, 0.5_rp, n_pts)
       call device_cmult(s13_d, 0.5_rp, n_pts)
       call device_cmult(s23_d, 0.5_rp, n_pts)
    else
       call cmult(s12, 0.5_rp, n_pts)
       call cmult(s13, 0.5_rp, n_pts)
       call cmult(s23, 0.5_rp, n_pts)
    end if

  end subroutine strain_rate


  !> Compute the Lambda2 field for a given velocity field.
  !! Uses the SX backend if enabled, otherwise the device backend if
  !! enabled, otherwise the CPU implementation (no libxsmm branch).
  !! @param lambda2 Receives the computed field.
  !! @param u The x component of the velocity field.
  !! @param v The y component of the velocity field.
  !! @param w The z component of the velocity field.
  !! @param coef The SEM coefficients.
  subroutine lambda2op(lambda2, u, v, w, coef)
    type(coef_t), intent(in) :: coef
    type(field_t), intent(inout) :: lambda2
    type(field_t), intent(in) :: u, v, w

    if (neko_bcknd_sx == 1) then
       call opr_sx_lambda2(lambda2, u, v, w, coef)
       return
    end if

    if (neko_bcknd_device == 1) then
       call opr_device_lambda2(lambda2, u, v, w, coef)
       return
    end if

    call opr_cpu_lambda2(lambda2, u, v, w, coef)

  end subroutine lambda2op


  !> Transforms the convecting velocity field to the rst form of the GL
  !! space.
  !! Uses the SX backend if enabled, otherwise libxsmm if enabled,
  !! otherwise the CPU implementation (no device branch).
  !! @param cr Receives the r component of the transformed field.
  !! @param cs Receives the s component of the transformed field.
  !! @param ct Receives the t component of the transformed field.
  !! @param cx The x component of the convecting velocity.
  !! @param cy The y component of the convecting velocity.
  !! @param cz The z component of the convecting velocity.
  !! @param Xh The function space; fixes the leading array extent.
  !! @param coef The SEM coefficients.
  subroutine set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
    type(space_t), intent(inout) :: xh
    type(coef_t), intent(inout) :: coef
    real(kind=rp), intent(inout) :: cr(Xh%lxyz, coef%msh%nelv), &
                                    cs(Xh%lxyz, coef%msh%nelv), &
                                    ct(Xh%lxyz, coef%msh%nelv)
    real(kind=rp), intent(in) :: cx(Xh%lxyz, coef%msh%nelv), &
                                 cy(Xh%lxyz, coef%msh%nelv), &
                                 cz(Xh%lxyz, coef%msh%nelv)

    if (neko_bcknd_sx == 1) then
       call opr_sx_set_convect_rst(cr, cs, ct, cx, cy, cz, xh, coef)
       return
    end if

    if (neko_bcknd_xsmm == 1) then
       call opr_xsmm_set_convect_rst(cr, cs, ct, cx, cy, cz, xh, coef)
       return
    end if

    call opr_cpu_set_convect_rst(cr, cs, ct, cx, cy, cz, xh, coef)

  end subroutine set_convect_rst


  !> Compute one step of Runge Kutta time interpolation for OIFS scheme.
  !! Four stages are evaluated. In each one the current state is divided
  !! by `coef%B`, mapped to the GL space, convected with `convect_scalar`,
  !! and the result is multiplied by `coef%B` again. The stage results are
  !! finally combined into `phi` with weights -dtau/6 (stages 1 and 4) and
  !! -dtau/3 (stages 2 and 3).
  !! @param phi The field being advanced, updated in place.
  !! @param c_r1 Convecting velocity used in stage 1.
  !! @param c_r23 Convecting velocity used in stages 2 and 3.
  !! @param c_r4 Convecting velocity used in stage 4.
  !! @param Xh_GLL The GLL function space.
  !! @param Xh_GL The GL function space.
  !! @param coef The SEM coefficients on the GLL space.
  !! @param coef_GL The SEM coefficients on the GL space.
  !! @param GLL_to_GL The interpolator used to map onto the GL space.
  !! @param tau Not referenced in this routine.
  !! @param dtau The step size of the sub-step.
  !! @param n Number of entries of `phi`.
  !! @param nel Element count handed to the interpolator.
  !! @param n_GL Number of entries of the GL work array.
  subroutine runge_kutta(phi, c_r1, c_r23, c_r4, Xh_GLL, Xh_GL, coef, &
                         coef_GL, GLL_to_GL, tau, dtau, n, nel, n_GL)
    type(space_t), intent(inout) :: xh_gll
    type(space_t), intent(inout) :: xh_gl
    type(coef_t), intent(inout) :: coef
    type(coef_t), intent(inout) :: coef_gl
    ! Forwarded to convect_scalar, which takes it as intent(inout).
    type(interpolator_t), intent(inout) :: gll_to_gl
    real(kind=rp), intent(inout) :: tau, dtau
    integer, intent(in) :: n, nel, n_gl
    real(kind=rp), dimension(n), intent(inout) :: phi
    real(kind=rp), dimension(3 * n_GL), intent(inout) :: c_r1, c_r23, c_r4
    real(kind=rp) :: c1, c2, c3
    ! Work Arrays
    real(kind=rp), dimension(n) :: u1, r1, r2, r3, r4
    real(kind=rp), dimension(n_GL) :: u1_gl
    integer :: i

    c1 = 1.0_rp
    c2 = -dtau/2.0_rp
    c3 = -dtau

    ! Stage 1: r1 = B * convect(phi / B)
    call invcol3 (u1, phi, coef%B, n)
    call gll_to_gl%map(u1_gl, u1, nel, xh_gl)
    call convect_scalar(r1, u1_gl, c_r1, xh_gll, xh_gl, coef, &
                        coef_gl, gll_to_gl)
    call col2(r1, coef%B, n)

    ! Stage 2: state is phi - dtau/2 * r1
    call add3s2 (u1, phi, r1, c1, c2, n)
    call invcol2 (u1, coef%B, n)
    call gll_to_gl%map(u1_gl, u1, nel, xh_gl)
    call convect_scalar(r2, u1_gl, c_r23, xh_gll, xh_gl, coef, &
                        coef_gl, gll_to_gl)
    call col2(r2, coef%B, n)

    ! Stage 3: state is phi - dtau/2 * r2
    call add3s2 (u1, phi, r2, c1, c2, n)
    call invcol2 (u1, coef%B, n)
    call gll_to_gl%map(u1_gl, u1, nel, xh_gl)
    call convect_scalar(r3, u1_gl, c_r23, xh_gll, xh_gl, coef, &
                        coef_gl, gll_to_gl)
    call col2(r3, coef%B, n)

    ! Stage 4: state is phi - dtau * r3
    call add3s2 (u1, phi, r3, c1, c3, n)
    call invcol2 (u1, coef%B, n)
    call gll_to_gl%map(u1_gl, u1, nel, xh_gl)
    call convect_scalar(r4, u1_gl, c_r4, xh_gll, xh_gl, coef, &
                        coef_gl, gll_to_gl)
    call col2(r4, coef%B, n)

    ! Combine the stages with the 1/6, 1/3, 1/3, 1/6 weights.
    c1 = -dtau/6.0_rp
    c2 = -dtau/3.0_rp
    do i = 1, n
       phi(i) = phi(i) + c1 * (r1(i) + r4(i)) + c2 * (r2(i) + r3(i))
    end do

  end subroutine runge_kutta


end module operators


    type(coef_t), intent(inout) :: coef …

                   intent(inout) :: cr, cs, ct …

  …

    real(kind=rp), intent(inout) :: s22(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv) …

    real(kind=rp), intent(in) :: dt …

    real(kind=rp), intent(inout) :: u(xh%lx, xh%ly, xh%lz, coef%msh%nelv) …

    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: dr …

    real(kind=rp) :: rlam …

    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uz …

    real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uz …

    real(kind=rp), dimension(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, &
         coef%msh%nelv), intent(inout) :: res …

  subroutine dudxyz (du, u, dr, ds, dt, coef) …

device::device_get_ptr
Return the device pointer for an associated Fortran array.
Definition device.F90:81

coefs
Coefficients.
Definition coef.f90:34

comm
Definition comm.F90:1

device_math
Definition device_math.F90:33

device_math::device_add2
subroutine, public device_add2(a_d, b_d, n)
Vector addition $a = a + b$.
Definition device_math.F90:247

device_math::device_cmult
subroutine, public device_cmult(a_d, c, n)
Multiplication by constant c: $a = c \cdot a$.
Definition device_math.F90:166

device_math::device_copy
subroutine, public device_copy(a_d, b_d, n)
Copy a vector .
Definition device_math.F90:76

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

field
Defines a field.
Definition field.f90:34

interpolation
Routines to interpolate between different spaces.
Definition interpolation.f90:34

lambda2
A simulation component that computes lambda2 The values are stored in the field registry under the na...
Definition lambda2.f90:37

math
Definition math.f90:60

math::cmult
subroutine, public cmult(a, c, n)
Multiplication by constant c: $a = c \cdot a$.
Definition math.f90:311

math::invcol2
subroutine, public invcol2(a, b, n)
Vector division $a = a / b$.
Definition math.f90:715

math::cadd
subroutine, public cadd(a, s, n)
Add a scalar to vector: $a_i = a_i + s$.
Definition math.f90:323

math::glsum
real(kind=rp) function, public glsum(a, n)
Sum a vector of length n.
Definition math.f90:360

math::add2
subroutine, public add2(a, b, n)
Vector addition $a = a + b$.
Definition math.f90:587

math::invcol3
subroutine, public invcol3(a, b, c, n)
Invert a vector: $a = b / c$.
Definition math.f90:487

math::add3s2
subroutine, public add3s2(a, b, c, c1, c2, n)
Returns $a = c_1 b + c_2 c$.
Definition math.f90:770

math::col2
subroutine, public col2(a, b, n)
Vector multiplication $a = a \cdot b$ (element-wise).
Definition math.f90:729

math::copy
subroutine, public copy(a, b, n)
Copy a vector .
Definition math.f90:239

math::rzero
subroutine, public rzero(a, n)
Zero a real vector.
Definition math.f90:195

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_sx
integer, parameter neko_bcknd_sx
Definition neko_config.f90:39

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

neko_config::neko_device_mpi
logical, parameter neko_device_mpi
Definition neko_config.f90:46

neko_config::neko_bcknd_xsmm
integer, parameter neko_bcknd_xsmm
Definition neko_config.f90:40

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

operators
Operators.
Definition operators.f90:34

operators::runge_kutta
subroutine, public runge_kutta(phi, c_r1, c_r23, c_r4, xh_gll, xh_gl, coef, coef_gl, gll_to_gl, tau, dtau, n, nel, n_gl)
Compute one step of Runge Kutta time interpolation for OIFS scheme.
Definition operators.f90:562

operators::set_convect_rst
subroutine, public set_convect_rst(cr, cs, ct, cx, cy, cz, xh, coef)
Transforms the convecting velocity field to the rst form of the GL space.
Definition operators.f90:528

operators::convect_scalar
subroutine convect_scalar(du, u, c, xh_gll, xh_gl, coef_gll, coef_gl, gll_to_gl)
Apply the convecting velocity c to the scalar field u, used in the OIFS scheme.
Definition operators.f90:327

operators::cfl
real(kind=rp) function, public cfl(dt, u, v, w, xh, coef, nelv, gdim)
Definition operators.f90:394

operators::opgrad
subroutine, public opgrad(ux, uy, uz, u, coef, es, ee)
Compute the weak gradient of a scalar field, i.e. the gradient multiplied by the mass matrix.
Definition operators.f90:171

operators::div
subroutine, public div(res, ux, uy, uz, coef)
Compute the divergence of a vector field.
Definition operators.f90:101

operators::conv1
subroutine, public conv1(du, u, vx, vy, vz, xh, coef, es, ee)
Compute the advection term.
Definition operators.f90:274

operators::grad
subroutine, public grad(ux, uy, uz, u, coef)
Compute the gradient of a scalar field.
Definition operators.f90:146

operators::curl
subroutine, public curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
Definition operators.f90:362

operators::strain_rate
subroutine, public strain_rate(s11, s22, s33, s12, s13, s23, u, v, w, coef)
Compute the strain rate tensor, i.e. 0.5 * (du_i/dx_j + du_j/dx_i).
Definition operators.f90:430

operators::lambda2op
subroutine, public lambda2op(lambda2, u, v, w, coef)
Compute the Lambda2 field for a given velocity field.
Definition operators.f90:503

operators::ortho
subroutine, public ortho(x, n, glb_n)
Orthogonalize with regard to vector (1,1,1,1,1,1...,1)^T.
Definition operators.f90:208

operators::cdtp
subroutine, public cdtp(dtx, x, dr, ds, dt, coef, es, ee)
Apply D^T to a scalar field, where D is the derivative matrix.
Definition operators.f90:230

operators::dudxyz
subroutine, public dudxyz(du, u, dr, ds, dt, coef)
Compute derivative of a scalar field along a single direction.
Definition operators.f90:76

opr_cpu
Operators CPU backend.
Definition opr_cpu.f90:34

opr_cpu::opr_cpu_curl
subroutine, public opr_cpu_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_xh)
Definition opr_cpu.f90:124

opr_cpu::opr_cpu_cfl
real(kind=rp) function, public opr_cpu_cfl(dt, u, v, w, xh, coef, nelv, gdim)
Definition opr_cpu.f90:175

opr_cpu::opr_cpu_lambda2
subroutine, public opr_cpu_lambda2(lambda2, u, v, w, coef)
Definition opr_cpu.f90:235

opr_device
Operators accelerator backends.
Definition opr_device.F90:34

opr_device::opr_device_curl
subroutine, public opr_device_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_xh)
Definition opr_device.F90:515

opr_device::opr_device_cdtp
subroutine, public opr_device_cdtp(dtx, x, dr, ds, dt, coef)
Definition opr_device.F90:432

opr_device::opr_device_cfl
real(kind=rp) function, public opr_device_cfl(dt, u, v, w, xh, coef, nelv, gdim)
Definition opr_device.F90:665

opr_device::opr_device_dudxyz
subroutine, public opr_device_dudxyz(du, u, dr, ds, dt, coef)
Definition opr_device.F90:325

opr_device::opr_device_opgrad
subroutine, public opr_device_opgrad(ux, uy, uz, u, coef)
Definition opr_device.F90:360

opr_device::opr_device_conv1
subroutine, public opr_device_conv1(du, u, vx, vy, vz, xh, coef, nelv, gdim)
Definition opr_device.F90:468

opr_device::opr_device_lambda2
subroutine, public opr_device_lambda2(lambda2, u, v, w, coef)
Definition opr_device.F90:402

opr_sx
Operators SX-Aurora backend.
Definition opr_sx.f90:2

opr_sx::opr_sx_curl
subroutine, public opr_sx_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_xh)
Definition opr_sx.f90:100

opr_xsmm
Operators libxsmm backend.
Definition opr_xsmm.F90:61

opr_xsmm::opr_xsmm_conv1
subroutine, public opr_xsmm_conv1(du, u, vx, vy, vz, xh, coef, nelv, gdim)
Definition opr_xsmm.F90:297

opr_xsmm::opr_xsmm_cdtp
subroutine, public opr_xsmm_cdtp(dtx, x, dr, ds, dt, coef)
Definition opr_xsmm.F90:242

opr_xsmm::opr_xsmm_curl
subroutine, public opr_xsmm_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_xh)
Definition opr_xsmm.F90:416

opr_xsmm::opr_xsmm_dudxyz
subroutine, public opr_xsmm_dudxyz(du, u, dr, ds, dt, coef)
Definition opr_xsmm.F90:92

opr_xsmm::opr_xsmm_opgrad
subroutine, public opr_xsmm_opgrad(ux, uy, uz, u, coef)
Definition opr_xsmm.F90:146

opr_xsmm::opr_xsmm_set_convect_rst
subroutine, public opr_xsmm_set_convect_rst(cr, cs, ct, cx, cy, cz, xh, coef)
Definition opr_xsmm.F90:467

opr_xsmm::opr_xsmm_convect_scalar
subroutine, public opr_xsmm_convect_scalar(du, u, c, xh_gll, xh_gl, coef_gll, coef_gl, gll_to_gl)
Definition opr_xsmm.F90:371

scratch_registry
Defines a registry for storing and requesting temporary fields This can be used when you have a funct...
Definition scratch_registry.f90:37

scratch_registry::neko_scratch_registry
type(scratch_registry_t), target, public neko_scratch_registry
Global scratch registry.
Definition scratch_registry.f90:85

space
Defines a function space.
Definition space.f90:34

coefs::coef_t
Coefficients defined on a given (mesh, ) tuple. Arrays use indices (i,j,k,e): element e,...
Definition coef.f90:55

field::field_t
Definition field.f90:46

interpolation::interpolator_t
Interpolation between two space::space_t.
Definition interpolation.f90:51

space::space_t
The function space for the SEM solution fields.
Definition space.f90:62