dd/dbf/operators_8f90_source.html

 ! Copyright (c) 2020-2024, The Neko Authors

 ! All rights reserved.

 !

 ! Redistribution and use in source and binary forms, with or without

 ! modification, are permitted provided that the following conditions

 ! are met:

 !

 !   * Redistributions of source code must retain the above copyright

 !     notice, this list of conditions and the following disclaimer.

 !

 !   * Redistributions in binary form must reproduce the above

 !     copyright notice, this list of conditions and the following

 !     disclaimer in the documentation and/or other materials provided

 !     with the distribution.

 !

 !   * Neither the name of the authors nor the names of its

 !     contributors may be used to endorse or promote products derived

 !     from this software without specific prior written permission.

 !

 ! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

 ! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

 ! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

 ! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

 ! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

 ! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

 ! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 ! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

 ! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

 ! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

 ! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 ! POSSIBILITY OF SUCH DAMAGE.

 !

 module operators

   use neko_config, only : neko_bcknd_sx, neko_bcknd_device, neko_bcknd_xsmm, &

                           neko_device_mpi

   use num_types, only : rp

   use opr_cpu, only : opr_cpu_cfl, opr_cpu_curl, opr_cpu_opgrad, &

                       opr_cpu_conv1, opr_cpu_convect_scalar, opr_cpu_cdtp, &

                       opr_cpu_dudxyz, opr_cpu_lambda2, opr_cpu_set_convect_rst

   use opr_sx, only : opr_sx_cfl, opr_sx_curl, opr_sx_opgrad, &

                      opr_sx_conv1, opr_sx_convect_scalar, opr_sx_cdtp, &

                      opr_sx_dudxyz, opr_sx_lambda2, opr_sx_set_convect_rst

   use opr_xsmm, only : opr_xsmm_cdtp, opr_xsmm_conv1, opr_xsmm_curl, &

                        opr_xsmm_dudxyz, opr_xsmm_opgrad, &

                        opr_xsmm_convect_scalar, opr_xsmm_set_convect_rst

   use opr_device, only : opr_device_cdtp, opr_device_cfl, opr_device_curl, &

                          opr_device_conv1, opr_device_dudxyz, &

                          opr_device_lambda2, opr_device_opgrad

   use space, only : space_t

   use coefs, only : coef_t

   use field, only : field_t

   use interpolation, only : interpolator_t

   use math, only : glsum, cmult, add2, add3s2, cadd, copy, col2, invcol2, &

                    invcol3, rzero

   use device, only : c_ptr, device_get_ptr

   use device_math, only : device_add2, device_cmult, device_copy

   use scratch_registry, only : neko_scratch_registry

   use comm

   implicit none

   private


   public :: dudxyz, opgrad, ortho, cdtp, conv1, curl, cfl, &

             lambda2op, strain_rate, div, grad, set_convect_rst, runge_kutta


 contains


   !> Compute derivative of a scalar field along a single direction.
   !! The work is handed to exactly one backend, tested in the order
   !! SX, libxsmm, device, with the CPU implementation as fallback.
   !! @param du Receives the derivative values.
   !! @param u The scalar field being differentiated.
   !! @param dr Array forwarded unchanged to the backend; callers in this
   !! module pass `coef%drdx`, `coef%drdy` or `coef%drdz`.
   !! @param ds Array forwarded unchanged to the backend; callers in this
   !! module pass `coef%dsdx`, `coef%dsdy` or `coef%dsdz`.
   !! @param dt Array forwarded unchanged to the backend; callers in this
   !! module pass `coef%dtdx`, `coef%dtdy` or `coef%dtdz`.
   !! @param coef The SEM coefficients; also supplies the array extents.
   subroutine dudxyz(du, u, dr, ds, dt, coef)
     type(coef_t), intent(in), target :: coef
     real(kind=rp), intent(inout) :: &
          du(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)
     real(kind=rp), intent(in), &
          dimension(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv) :: &
          u, dr, ds, dt

     if (neko_bcknd_sx == 1) then
        call opr_sx_dudxyz(du, u, dr, ds, dt, coef)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_dudxyz(du, u, dr, ds, dt, coef)
     else if (neko_bcknd_device == 1) then
        call opr_device_dudxyz(du, u, dr, ds, dt, coef)
     else
        ! No accelerated backend selected
        call opr_cpu_dudxyz(du, u, dr, ds, dt, coef)
     end if

   end subroutine dudxyz


   !> Compute the divergence of a vector field.
   !! The three directional derivatives are evaluated one after another
   !! with `dudxyz`; the y and z contributions go through a temporary
   !! field borrowed from the global scratch registry and are then added
   !! onto `res`.
   !! @param res Receives the divergence.
   !! @param ux The x component of the vector field.
   !! @param uy The y component of the vector field.
   !! @param uz The z component of the vector field.
   !! @param coef The SEM coefficients.
   subroutine div(res, ux, uy, uz, coef)
     type(coef_t), intent(in), target :: coef
     real(kind=rp), intent(inout) :: &
          res(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv)
     real(kind=rp), intent(in), &
          dimension(coef%Xh%lx, coef%Xh%ly, coef%Xh%lz, coef%msh%nelv) :: &
          ux, uy, uz
     type(field_t), pointer :: work
     type(c_ptr) :: res_d
     integer :: ind
     logical :: on_device

     on_device = (neko_bcknd_device == 1)

     ! The device pointer of res is only looked up on the device backend
     if (on_device) res_d = device_get_ptr(res)

     call neko_scratch_registry%request_field(work, ind)

     ! res = dux / dx
     call dudxyz(res, ux, coef%drdx, coef%dsdx, coef%dtdx, coef)

     ! res = res + duy / dy
     call dudxyz(work%x, uy, coef%drdy, coef%dsdy, coef%dtdy, coef)
     if (on_device) then
        call device_add2(res_d, work%x_d, work%size())
     else
        call add2(res, work%x, work%size())
     end if

     ! res = res + duz / dz
     call dudxyz(work%x, uz, coef%drdz, coef%dsdz, coef%dtdz, coef)
     if (on_device) then
        call device_add2(res_d, work%x_d, work%size())
     else
        call add2(res, work%x, work%size())
     end if

     ! Hand the temporary back to the registry
     call neko_scratch_registry%relinquish_field(ind)

   end subroutine div


   !> Compute the gradient of a scalar field.
   !! Each component is obtained by one call to `dudxyz` with the
   !! matching set of `coef%d{r,s,t}d{x,y,z}` arrays.
   !! @param ux Receives the x component of the gradient.
   !! @param uy Receives the y component of the gradient.
   !! @param uz Receives the z component of the gradient.
   !! @param u The scalar field.
   !! @param coef The SEM coefficients.
   subroutine grad(ux, uy, uz, u, coef)
     type(coef_t), intent(in) :: coef
     real(kind=rp), intent(inout), &
          dimension(coef%Xh%lxyz, coef%msh%nelv) :: ux, uy, uz
     real(kind=rp), intent(in) :: u(coef%Xh%lxyz, coef%msh%nelv)

     ! d/dx
     call dudxyz(ux, u, coef%drdx, coef%dsdx, coef%dtdx, coef)
     ! d/dy
     call dudxyz(uy, u, coef%drdy, coef%dsdy, coef%dtdy, coef)
     ! d/dz
     call dudxyz(uz, u, coef%drdz, coef%dsdz, coef%dtdz, coef)

   end subroutine grad


   !> Compute the weak gradient of a scalar field, i.e. the gradient
   !! multiplied by the mass matrix.
   !! @param ux Receives the x component.
   !! @param uy Receives the y component.
   !! @param uz Receives the z component.
   !! @param u The scalar field.
   !! @param coef The SEM coefficients.
   !! @param es Optional first element of the block to process,
   !! defaults to 1.
   !! @param ee Optional last element of the block to process,
   !! defaults to `coef%msh%nelv`.
   !! @note Only the CPU backend receives the element block; the SX,
   !! libxsmm and device backends are called without `es`/`ee`.
   subroutine opgrad(ux, uy, uz, u, coef, es, ee)
     type(coef_t), intent(in) :: coef
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: ux
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uy
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: uz
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: u
     ! The block bounds are only read here, so they are declared intent(in)
     integer, intent(in), optional :: es, ee
     integer :: eblk_start, eblk_end

     ! Fall back to the full element range for any bound not supplied
     eblk_start = 1
     if (present(es)) eblk_start = es

     eblk_end = coef%msh%nelv
     if (present(ee)) eblk_end = ee

     if (neko_bcknd_sx == 1) then
        call opr_sx_opgrad(ux, uy, uz, u, coef)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_opgrad(ux, uy, uz, u, coef)
     else if (neko_bcknd_device == 1) then
        call opr_device_opgrad(ux, uy, uz, u, coef)
     else
        call opr_cpu_opgrad(ux, uy, uz, u, coef, eblk_start, eblk_end)
     end if

   end subroutine opgrad


   !> Orthogonalize with regard to vector (1,1,1,1,1,1...,1)^T.
   !! The value `glsum(x, n) / glb_n` is subtracted from every entry
   !! of `x`.
   !! @param x The vector, modified in place.
   !! @param n Length of `x`.
   !! @param glb_n Divisor applied to the sum returned by `glsum`
   !! (presumably the global number of entries - confirm with callers).
   subroutine ortho(x, n, glb_n)
     integer, intent(in) :: n
     integer, intent(in) :: glb_n
     real(kind=rp), intent(inout) :: x(n)
     real(kind=rp) :: shift

     ! Negated mean, so that cadd removes it from x
     shift = -(glsum(x, n) / real(glb_n, kind=rp))
     call cadd(x, shift, n)

   end subroutine ortho


   !> Apply D^T to a scalar field, where D is the derivative matrix.
   !! @param dtx Receives the result.
   !! @param x The scalar field; declared `intent(inout)` and forwarded
   !! as such to the backend.
   !! @param dr Array forwarded unchanged to the backend.
   !! @param ds Array forwarded unchanged to the backend.
   !! @param dt Array forwarded unchanged to the backend.
   !! @param coef The SEM coefficients.
   !! @param es Optional first element of the block to process,
   !! defaults to 1.
   !! @param ee Optional last element of the block to process,
   !! defaults to `coef%msh%nelv`.
   !! @note Only the CPU backend receives the element block; the SX,
   !! libxsmm and device backends are called without `es`/`ee`.
   subroutine cdtp (dtx, x, dr, ds, dt, coef, es, ee)
     type(coef_t), intent(in) :: coef
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: dtx
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(inout) :: x
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: dr
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: ds
     real(kind=rp), dimension(coef%Xh%lxyz, coef%msh%nelv), intent(in) :: dt
     ! The block bounds are only read here, so they are declared intent(in)
     integer, intent(in), optional :: es, ee
     integer :: eblk_start, eblk_end

     ! Fall back to the full element range for any bound not supplied
     eblk_start = 1
     if (present(es)) eblk_start = es

     eblk_end = coef%msh%nelv
     if (present(ee)) eblk_end = ee

     if (neko_bcknd_sx == 1) then
        call opr_sx_cdtp(dtx, x, dr, ds, dt, coef)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_cdtp(dtx, x, dr, ds, dt, coef)
     else if (neko_bcknd_device == 1) then
        call opr_device_cdtp(dtx, x, dr, ds, dt, coef)
     else
        call opr_cpu_cdtp(dtx, x, dr, ds, dt, coef, eblk_start, eblk_end)
     end if

   end subroutine cdtp


   !> Compute the advection term.
   !! @param du Receives the result.
   !! @param u The field forwarded to the backend as second argument.
   !! @param vx The field forwarded to the backend as third argument.
   !! @param vy The field forwarded to the backend as fourth argument.
   !! @param vz The field forwarded to the backend as fifth argument.
   !! @param Xh The SEM function space.
   !! @param coef The SEM coefficients.
   !! @param es Optional first element of the block to process,
   !! defaults to 1.
   !! @param ee Optional last element of the block to process,
   !! defaults to `coef%msh%nelv`.
   !! @note Only the CPU backend receives the element block; the other
   !! backends are called with the full element count instead.
   subroutine conv1(du, u, vx, vy, vz, Xh, coef, es, ee)
     type(space_t), intent(inout) :: Xh
     type(coef_t), intent(inout) :: coef
     real(kind=rp), intent(inout) :: du(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: u(Xh%lx, Xh%ly, Xh%lz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: vx(Xh%lx, Xh%ly, Xh%lz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: vy(Xh%lx, Xh%ly, Xh%lz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: vz(Xh%lx, Xh%ly, Xh%lz, coef%msh%nelv)
     ! The block bounds are only read here, so they are declared intent(in)
     integer, intent(in), optional :: es, ee
     integer :: eblk_end, eblk_start

     associate(nelv => coef%msh%nelv, gdim => coef%msh%gdim)

       ! Fall back to the full element range for any bound not supplied
       eblk_start = 1
       if (present(es)) eblk_start = es

       eblk_end = nelv
       if (present(ee)) eblk_end = ee

       if (neko_bcknd_sx == 1) then
          call opr_sx_conv1(du, u, vx, vy, vz, Xh, coef, nelv)
       else if (neko_bcknd_xsmm == 1) then
          call opr_xsmm_conv1(du, u, vx, vy, vz, Xh, coef, nelv, gdim)
       else if (neko_bcknd_device == 1) then
          call opr_device_conv1(du, u, vx, vy, vz, Xh, coef, nelv, gdim)
       else
          call opr_cpu_conv1(du, u, vx, vy, vz, Xh, coef, eblk_start, eblk_end)
       end if

     end associate

   end subroutine conv1


   !> Apply the convecting velocity c to the scalar field u, used in the
   !! OIFS scheme.
   !! @param du Receives the result; dimensioned on the GLL space.
   !! @param u The scalar field; dimensioned on the GL space.
   !! @param c The convecting velocity; dimensioned on the GL space with
   !! three components in the last index.
   !! @param Xh_GLL The GLL function space.
   !! @param Xh_GL The GL function space.
   !! @param coef_GLL The coefficients for the GLL space.
   !! @param coef_GL The coefficients for the GL space.
   !! @param GLL_to_GL The interpolator forwarded to the backend.
   !! @note There is no device branch here; any configuration other than
   !! SX or libxsmm ends up in the CPU implementation.
   subroutine convect_scalar(du, u, c, Xh_GLL, Xh_GL, coef_GLL, &
                             coef_GL, GLL_to_GL)
     type(space_t), intent(in) :: Xh_GL
     type(space_t), intent(in) :: Xh_GLL
     type(coef_t), intent(in) :: coef_GLL
     type(coef_t), intent(in) :: coef_GL
     type(interpolator_t), intent(inout) :: GLL_to_GL
     real(kind=rp), intent(inout) :: &
          du(Xh_GLL%lx, Xh_GLL%ly, Xh_GLL%lz, coef_GL%msh%nelv)
     ! Extents follow (lx, ly, lz) like du, so that the declared size
     ! matches the actual argument even when ly or lz differ from lx
     real(kind=rp), intent(inout) :: &
          u(Xh_GL%lx, Xh_GL%ly, Xh_GL%lz, coef_GL%msh%nelv)
     real(kind=rp), intent(inout) :: c(Xh_GL%lxyz, coef_GL%msh%nelv, 3)

     if (neko_bcknd_sx == 1) then
        call opr_sx_convect_scalar(du, u, c, Xh_GLL, Xh_GL, &
                                   coef_GLL, coef_GL, GLL_to_GL)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_convect_scalar(du, u, c, Xh_GLL, Xh_GL, &
                                     coef_GLL, coef_GL, GLL_to_GL)
     else
        call opr_cpu_convect_scalar(du, u, c, Xh_GLL, Xh_GL, &
                                    coef_GLL, coef_GL, GLL_to_GL)
     end if

   end subroutine convect_scalar


   !> Compute the curl of a vector field.
   !! The call is forwarded to one backend, tested in the order
   !! SX, libxsmm, device, with the CPU implementation as fallback.
   !! @param w1 Will store the x component of the curl.
   !! @param w2 Will store the y component of the curl.
   !! @param w3 Will store the z component of the curl.
   !! @param u1 The x component of the vector field.
   !! @param u2 The y component of the vector field.
   !! @param u3 The z component of the vector field.
   !! @param work1 A temporary array for computations.
   !! @param work2 A temporary array for computations.
   !! @param coef The SEM coefficients.
   subroutine curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
     type(field_t), intent(inout) :: w1, w2, w3
     type(field_t), intent(inout) :: u1, u2, u3
     type(field_t), intent(inout) :: work1, work2
     type(coef_t), intent(in) :: coef

     if (neko_bcknd_sx == 1) then
        call opr_sx_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
     else if (neko_bcknd_device == 1) then
        call opr_device_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
     else
        ! No accelerated backend selected
        call opr_cpu_curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
     end if

   end subroutine curl


   !> Compute the CFL number.
   !! The backend value is combined with an MPI max reduction over
   !! `neko_comm`, except when `neko_device_mpi` is set, in which case
   !! the backend value is returned as is.
   !! @param dt The timestep.
   !! @param u The x component of velocity.
   !! @param v The y component of velocity.
   !! @param w The z component of velocity.
   !! @param Xh The SEM function space.
   !! @param coef The SEM coefficients.
   !! @param nelv The number of elements, i.e. the last extent of
   !! `u`, `v` and `w`.
   !! @param gdim Number of geometric dimensions.
   !! @note There is no libxsmm branch; that configuration uses the CPU
   !! implementation. The SX backend is called without `gdim`.
   function cfl(dt, u, v, w, Xh, coef, nelv, gdim) result(cfl_val)
     type(space_t), intent(in) :: Xh
     type(coef_t), intent(in) :: coef
     integer, intent(in) :: nelv, gdim
     real(kind=rp), intent(in) :: dt
     real(kind=rp), intent(in) :: u(Xh%lx, Xh%ly, Xh%lz, nelv)
     real(kind=rp), intent(in) :: v(Xh%lx, Xh%ly, Xh%lz, nelv)
     real(kind=rp), intent(in) :: w(Xh%lx, Xh%ly, Xh%lz, nelv)
     real(kind=rp) :: cfl_val
     integer :: ierr

     if (neko_bcknd_sx == 1) then
        cfl_val = opr_sx_cfl(dt, u, v, w, Xh, coef, nelv)
     else if (neko_bcknd_device == 1) then
        cfl_val = opr_device_cfl(dt, u, v, w, Xh, coef, nelv, gdim)
     else
        cfl_val = opr_cpu_cfl(dt, u, v, w, Xh, coef, nelv, gdim)
     end if

     ! In-place max reduction; the returned ierr is not inspected
     if (.not. neko_device_mpi) then
        call mpi_allreduce(mpi_in_place, cfl_val, 1, &
             mpi_real_precision, mpi_max, neko_comm, ierr)
     end if

   end function cfl


   !> Compute the strain rate tensor, i.e.
   !! S_ij = 0.5 * (du_i/dx_j + du_j/dx_i).
   !! The off-diagonal terms are assembled first, using `s11` as scratch
   !! space for the second derivative of each pair; the diagonal terms
   !! are written last so that `s11` ends up holding du/dx.
   !! @param s11 Receives du/dx.
   !! @param s22 Receives dv/dy.
   !! @param s33 Receives dw/dz.
   !! @param s12 Receives 0.5 * (du/dy + dv/dx).
   !! @param s13 Receives 0.5 * (du/dz + dw/dx).
   !! @param s23 Receives 0.5 * (dv/dz + dw/dy).
   !! @param u The x component of velocity.
   !! @param v The y component of velocity.
   !! @param w The z component of velocity.
   !! @param coef The SEM coefficients.
   subroutine strain_rate(s11, s22, s33, s12, s13, s23, u, v, w, coef)
     type(field_t), intent(in) :: u, v, w
     type(coef_t), intent(in) :: coef
     real(kind=rp), intent(inout), &
          dimension(u%Xh%lx, u%Xh%ly, u%Xh%lz, u%msh%nelv) :: &
          s11, s22, s33, s12, s13, s23

     type(c_ptr) :: s11_d, s22_d, s33_d, s12_d, s23_d, s13_d
     integer :: n
     logical :: on_device

     on_device = (neko_bcknd_device == 1)

     if (on_device) then
        s11_d = device_get_ptr(s11)
        s22_d = device_get_ptr(s22)
        s33_d = device_get_ptr(s33)
        s12_d = device_get_ptr(s12)
        s23_d = device_get_ptr(s23)
        s13_d = device_get_ptr(s13)
     end if

     ! Total number of entries per tensor component
     n = u%msh%nelv * u%Xh%lxyz

     ! s12 = du/dy + dv/dx (s11 is scratch)
     call dudxyz(s12, u%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
     call dudxyz(s11, v%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
     if (on_device) then
        call device_add2(s12_d, s11_d, n)
     else
        call add2(s12, s11, n)
     end if

     ! s13 = du/dz + dw/dx (s11 is scratch)
     call dudxyz(s13, u%x, coef%drdz, coef%dsdz, coef%dtdz, coef)
     call dudxyz(s11, w%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
     if (on_device) then
        call device_add2(s13_d, s11_d, n)
     else
        call add2(s13, s11, n)
     end if

     ! s23 = dv/dz + dw/dy (s11 is scratch)
     call dudxyz(s23, v%x, coef%drdz, coef%dsdz, coef%dtdz, coef)
     call dudxyz(s11, w%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
     if (on_device) then
        call device_add2(s23_d, s11_d, n)
     else
        call add2(s23, s11, n)
     end if

     ! Diagonal terms; s11 is no longer needed as scratch
     call dudxyz(s11, u%x, coef%drdx, coef%dsdx, coef%dtdx, coef)
     call dudxyz(s22, v%x, coef%drdy, coef%dsdy, coef%dtdy, coef)
     call dudxyz(s33, w%x, coef%drdz, coef%dsdz, coef%dtdz, coef)

     ! Halve the off-diagonal sums
     if (on_device) then
        call device_cmult(s12_d, 0.5_rp, n)
        call device_cmult(s13_d, 0.5_rp, n)
        call device_cmult(s23_d, 0.5_rp, n)
     else
        call cmult(s12, 0.5_rp, n)
        call cmult(s13, 0.5_rp, n)
        call cmult(s23, 0.5_rp, n)
     end if

   end subroutine strain_rate


   !> Compute the Lambda2 field for a given velocity field.
   !! @param lambda2 Receives the result.
   !! @param u The x component of velocity.
   !! @param v The y component of velocity.
   !! @param w The z component of velocity.
   !! @param coef The SEM coefficients.
   !! @note There is no libxsmm branch; that configuration uses the CPU
   !! implementation.
   subroutine lambda2op(lambda2, u, v, w, coef)
     type(coef_t), intent(in) :: coef
     type(field_t), intent(inout) :: lambda2
     type(field_t), intent(in) :: u, v, w

     if (neko_bcknd_sx == 1) then
        call opr_sx_lambda2(lambda2, u, v, w, coef)
     else if (neko_bcknd_device == 1) then
        call opr_device_lambda2(lambda2, u, v, w, coef)
     else
        call opr_cpu_lambda2(lambda2, u, v, w, coef)
     end if

   end subroutine lambda2op


   !> Transforms the convecting velocity field to the rst form of the
   !! GL space.
   !! @param cr Receives the first transformed component.
   !! @param cs Receives the second transformed component.
   !! @param ct Receives the third transformed component.
   !! @param cx The first input component.
   !! @param cy The second input component.
   !! @param cz The third input component.
   !! @param Xh The function space supplying the array extents.
   !! @param coef The coefficients forwarded to the backend.
   !! @note There is no device branch here; any configuration other than
   !! SX or libxsmm ends up in the CPU implementation.
   subroutine set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
     type(space_t), intent(inout) :: Xh
     type(coef_t), intent(inout) :: coef
     real(kind=rp), intent(inout) :: cr(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: cs(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(inout) :: ct(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(in) :: cx(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(in) :: cy(Xh%lxyz, coef%msh%nelv)
     real(kind=rp), intent(in) :: cz(Xh%lxyz, coef%msh%nelv)

     if (neko_bcknd_sx == 1) then
        call opr_sx_set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
     else if (neko_bcknd_xsmm == 1) then
        call opr_xsmm_set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
     else
        call opr_cpu_set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
     end if

   end subroutine set_convect_rst


   !> Compute one step of Runge Kutta time interpolation for OIFS scheme.
   !! Four convective evaluations r1..r4 are formed with `convect_scalar`
   !! and combined as
   !! phi = phi - dtau/6 * (r1 + r4) - dtau/3 * (r2 + r3).
   !! Before every evaluation the stage value is divided by `coef%B` and
   !! mapped with `GLL_to_GL%map`; afterwards the result is multiplied by
   !! `coef%B` again.
   !! @param phi The quantity being advanced, updated in place.
   !! @param c_r1 Convecting field used in stage 1.
   !! @param c_r23 Convecting field used in stages 2 and 3.
   !! @param c_r4 Convecting field used in stage 4.
   !! @param Xh_GLL The GLL function space.
   !! @param Xh_GL The GL function space.
   !! @param coef The coefficients for the GLL space.
   !! @param coef_GL The coefficients for the GL space.
   !! @param GLL_to_GL The interpolator used to map each stage value.
   !! @param tau Not referenced inside this routine.
   !! @param dtau The step size entering the stage and final weights.
   !! @param n Length of `phi` and of the GLL work arrays.
   !! @param nel Element count handed to `GLL_to_GL%map`.
   !! @param n_GL Length of the GL work array; the convecting fields
   !! hold `3 * n_GL` entries each.
   subroutine runge_kutta(phi, c_r1, c_r23, c_r4, Xh_GLL, Xh_GL, coef, &
                          coef_GL, GLL_to_GL, tau, dtau, n, nel, n_GL)
     type(space_t), intent(inout) :: Xh_GLL
     type(space_t), intent(inout) :: Xh_GL
     type(coef_t), intent(inout) :: coef
     type(coef_t), intent(inout) :: coef_GL
     ! convect_scalar takes the interpolator as intent(inout)
     type(interpolator_t), intent(inout) :: GLL_to_GL
     real(kind=rp), intent(inout) :: tau, dtau
     integer, intent(in) :: n, nel, n_GL
     real(kind=rp), dimension(n), intent(inout) :: phi
     real(kind=rp), dimension(3 * n_GL), intent(inout) :: c_r1, c_r23, c_r4
     real(kind=rp) :: c1, c2, c3
     real(kind=rp) :: w_outer, w_inner
     ! Work arrays
     ! NOTE(review): these are automatic arrays sized by n and n_GL;
     ! confirm the stack limit is adequate for large problem sizes.
     real(kind=rp), dimension(n) :: u1, r1, r2, r3, r4
     real(kind=rp), dimension(n_GL) :: u1_GL

     ! Stage coefficients
     c1 = 1.0_rp
     c2 = -dtau / 2.0_rp
     c3 = -dtau

     ! Stage 1: evaluate at phi
     call invcol3(u1, phi, coef%B, n)
     call GLL_to_GL%map(u1_GL, u1, nel, Xh_GL)
     call convect_scalar(r1, u1_GL, c_r1, Xh_GLL, Xh_GL, coef, &
                         coef_GL, GLL_to_GL)
     call col2(r1, coef%B, n)

     ! Stage 2: evaluate at phi - dtau/2 * r1
     call add3s2(u1, phi, r1, c1, c2, n)
     call invcol2(u1, coef%B, n)
     call GLL_to_GL%map(u1_GL, u1, nel, Xh_GL)
     call convect_scalar(r2, u1_GL, c_r23, Xh_GLL, Xh_GL, coef, &
                         coef_GL, GLL_to_GL)
     call col2(r2, coef%B, n)

     ! Stage 3: evaluate at phi - dtau/2 * r2
     call add3s2(u1, phi, r2, c1, c2, n)
     call invcol2(u1, coef%B, n)
     call GLL_to_GL%map(u1_GL, u1, nel, Xh_GL)
     call convect_scalar(r3, u1_GL, c_r23, Xh_GLL, Xh_GL, coef, &
                         coef_GL, GLL_to_GL)
     call col2(r3, coef%B, n)

     ! Stage 4: evaluate at phi - dtau * r3
     call add3s2(u1, phi, r3, c1, c3, n)
     call invcol2(u1, coef%B, n)
     call GLL_to_GL%map(u1_GL, u1, nel, Xh_GL)
     call convect_scalar(r4, u1_GL, c_r4, Xh_GLL, Xh_GL, coef, &
                         coef_GL, GLL_to_GL)
     call col2(r4, coef%B, n)

     ! Weighted combination of the four stages
     w_outer = -dtau / 6.0_rp
     w_inner = -dtau / 3.0_rp
     phi = phi + w_outer * (r1 + r4) + w_inner * (r2 + r3)

   end subroutine runge_kutta


 end module operators

 device::device_get_ptr
Return the device pointer for an associated Fortran array.
Definition: device.F90:81

coefs
Coefficients.
Definition: coef.f90:34

comm
Definition: comm.F90:1

device_math
Definition: device_math.F90:33

device_math::device_add2
subroutine, public device_add2(a_d, b_d, n)
Vector addition $a = a + b$.
Definition: device_math.F90:247

device_math::device_cmult
subroutine, public device_cmult(a_d, c, n)
Multiplication by constant c, $a = c \cdot a$.
Definition: device_math.F90:166

device_math::device_copy
subroutine, public device_copy(a_d, b_d, n)
Copy a vector $a = b$.
Definition: device_math.F90:76

device
Device abstraction, common interface for various accelerators.
Definition: device.F90:34

field
Defines a field.
Definition: field.f90:34

interpolation
Routines to interpolate between different spaces.
Definition: interpolation.f90:34

lambda2
A simulation component that computes lambda2 The values are stored in the field registry under the na...
Definition: lambda2.f90:37

math
Definition: math.f90:60

math::cmult
subroutine, public cmult(a, c, n)
Multiplication by constant c, $a = c \cdot a$.
Definition: math.f90:311

math::invcol2
subroutine, public invcol2(a, b, n)
Vector division $a = a / b$.
Definition: math.f90:715

math::cadd
subroutine, public cadd(a, s, n)
Add a scalar to vector $a_i = a_i + s$.
Definition: math.f90:323

math::glsum
real(kind=rp) function, public glsum(a, n)
Sum a vector of length n.
Definition: math.f90:360

math::add2
subroutine, public add2(a, b, n)
Vector addition $a = a + b$.
Definition: math.f90:587

math::invcol3
subroutine, public invcol3(a, b, c, n)
Invert a vector $a = b / c$.
Definition: math.f90:487

math::add3s2
subroutine, public add3s2(a, b, c, c1, c2, n)
Returns $a = c_1 b + c_2 c$.
Definition: math.f90:770

math::col2
subroutine, public col2(a, b, n)
Vector multiplication $a = a \cdot b$.
Definition: math.f90:729

math::copy
subroutine, public copy(a, b, n)
Copy a vector $a = b$.
Definition: math.f90:239

math::rzero
subroutine, public rzero(a, n)
Zero a real vector.
Definition: math.f90:195

neko_config
Build configurations.
Definition: neko_config.f90:34

neko_config::neko_bcknd_sx
integer, parameter neko_bcknd_sx
Definition: neko_config.f90:39

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition: neko_config.f90:44

neko_config::neko_device_mpi
logical, parameter neko_device_mpi
Definition: neko_config.f90:46

neko_config::neko_bcknd_xsmm
integer, parameter neko_bcknd_xsmm
Definition: neko_config.f90:40

num_types
Definition: num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition: num_types.f90:12

operators
Operators.
Definition: operators.f90:34

operators::runge_kutta
subroutine, public runge_kutta(phi, c_r1, c_r23, c_r4, Xh_GLL, Xh_GL, coef, coef_GL, GLL_to_GL, tau, dtau, n, nel, n_GL)
Compute one step of Runge Kutta time interpolation for OIFS scheme.
Definition: operators.f90:562

operators::opgrad
subroutine, public opgrad(ux, uy, uz, u, coef, es, ee)
Compute the weak gradient of a scalar field, i.e. the gradient multiplied by the mass matrix.
Definition: operators.f90:171

operators::set_convect_rst
subroutine, public set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
Transforms the convecting velocity field to the rst form of the GL space.
Definition: operators.f90:528

operators::div
subroutine, public div(res, ux, uy, uz, coef)
Compute the divergence of a vector field.
Definition: operators.f90:101

operators::convect_scalar
subroutine convect_scalar(du, u, c, Xh_GLL, Xh_GL, coef_GLL, coef_GL, GLL_to_GL)
Apply the convecting velocity c to the scalar field u, used in the OIFS scheme.
Definition: operators.f90:327

operators::grad
subroutine, public grad(ux, uy, uz, u, coef)
Compute the gradient of a scalar field.
Definition: operators.f90:146

operators::curl
subroutine, public curl(w1, w2, w3, u1, u2, u3, work1, work2, coef)
Definition: operators.f90:362

operators::strain_rate
subroutine, public strain_rate(s11, s22, s33, s12, s13, s23, u, v, w, coef)
Compute the strain rate tensor, i.e. $S_{ij} = 0.5\,(\partial u_i/\partial x_j + \partial u_j/\partial x_i)$.
Definition: operators.f90:430

operators::lambda2op
subroutine, public lambda2op(lambda2, u, v, w, coef)
Compute the Lambda2 field for a given velocity field.
Definition: operators.f90:503

operators::ortho
subroutine, public ortho(x, n, glb_n)
Orthogonalize with regard to the vector (1,1,1,1,1,1...,1)^T.
Definition: operators.f90:208

operators::cdtp
subroutine, public cdtp(dtx, x, dr, ds, dt, coef, es, ee)
Apply D^T to a scalar field, where D is the derivative matrix.
Definition: operators.f90:230

operators::dudxyz
subroutine, public dudxyz(du, u, dr, ds, dt, coef)
Compute derivative of a scalar field along a single direction.
Definition: operators.f90:76

operators::cfl
real(kind=rp) function, public cfl(dt, u, v, w, Xh, coef, nelv, gdim)
Definition: operators.f90:394

operators::conv1
subroutine, public conv1(du, u, vx, vy, vz, Xh, coef, es, ee)
Compute the advection term.
Definition: operators.f90:274

opr_cpu
Operators CPU backend.
Definition: opr_cpu.f90:34

opr_cpu::opr_cpu_curl
subroutine, public opr_cpu_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_Xh)
Definition: opr_cpu.f90:124

opr_cpu::opr_cpu_lambda2
subroutine, public opr_cpu_lambda2(lambda2, u, v, w, coef)
Definition: opr_cpu.f90:235

opr_cpu::opr_cpu_cfl
real(kind=rp) function, public opr_cpu_cfl(dt, u, v, w, Xh, coef, nelv, gdim)
Definition: opr_cpu.f90:175

opr_device
Operators accelerator backends.
Definition: opr_device.F90:34

opr_device::opr_device_cfl
real(kind=rp) function, public opr_device_cfl(dt, u, v, w, Xh, coef, nelv, gdim)
Definition: opr_device.F90:665

opr_device::opr_device_cdtp
subroutine, public opr_device_cdtp(dtx, x, dr, ds, dt, coef)
Definition: opr_device.F90:432

opr_device::opr_device_conv1
subroutine, public opr_device_conv1(du, u, vx, vy, vz, Xh, coef, nelv, gdim)
Definition: opr_device.F90:468

opr_device::opr_device_dudxyz
subroutine, public opr_device_dudxyz(du, u, dr, ds, dt, coef)
Definition: opr_device.F90:325

opr_device::opr_device_curl
subroutine, public opr_device_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_Xh)
Definition: opr_device.F90:515

opr_device::opr_device_opgrad
subroutine, public opr_device_opgrad(ux, uy, uz, u, coef)
Definition: opr_device.F90:360

opr_device::opr_device_lambda2
subroutine, public opr_device_lambda2(lambda2, u, v, w, coef)
Definition: opr_device.F90:402

opr_sx
Operators SX-Aurora backend.
Definition: opr_sx.f90:2

opr_sx::opr_sx_curl
subroutine, public opr_sx_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_Xh)
Definition: opr_sx.f90:100

opr_xsmm
Operators libxsmm backend.
Definition: opr_xsmm.F90:61

opr_xsmm::opr_xsmm_convect_scalar
subroutine, public opr_xsmm_convect_scalar(du, u, c, Xh_GLL, Xh_GL, coef_GLL, coef_GL, GLL_to_GL)
Definition: opr_xsmm.F90:371

opr_xsmm::opr_xsmm_cdtp
subroutine, public opr_xsmm_cdtp(dtx, x, dr, ds, dt, coef)
Definition: opr_xsmm.F90:242

opr_xsmm::opr_xsmm_set_convect_rst
subroutine, public opr_xsmm_set_convect_rst(cr, cs, ct, cx, cy, cz, Xh, coef)
Definition: opr_xsmm.F90:467

opr_xsmm::opr_xsmm_dudxyz
subroutine, public opr_xsmm_dudxyz(du, u, dr, ds, dt, coef)
Definition: opr_xsmm.F90:92

opr_xsmm::opr_xsmm_opgrad
subroutine, public opr_xsmm_opgrad(ux, uy, uz, u, coef)
Definition: opr_xsmm.F90:146

opr_xsmm::opr_xsmm_curl
subroutine, public opr_xsmm_curl(w1, w2, w3, u1, u2, u3, work1, work2, c_Xh)
Definition: opr_xsmm.F90:416

opr_xsmm::opr_xsmm_conv1
subroutine, public opr_xsmm_conv1(du, u, vx, vy, vz, Xh, coef, nelv, gdim)
Definition: opr_xsmm.F90:297

scratch_registry
Defines a registry for storing and requesting temporary fields This can be used when you have a funct...
Definition: scratch_registry.f90:37

scratch_registry::neko_scratch_registry
type(scratch_registry_t), target, public neko_scratch_registry
Global scratch registry.
Definition: scratch_registry.f90:85

space
Defines a function space.
Definition: space.f90:34

coefs::coef_t
Coefficients defined on a given (mesh, $X_h$) tuple. Arrays use indices (i,j,k,e): element e,...
Definition: coef.f90:55

field::field_t
Definition: field.f90:46

interpolation::interpolator_t
Interpolation between two space::space_t.
Definition: interpolation.f90:51

space::space_t
The function space for the SEM solution fields.
Definition: space.f90:62