d7/dbb/adv__dealias_8f90_source.html

! Copyright (c) 2021-2024, The Neko Authors

! All rights reserved.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

!   * Redistributions of source code must retain the above copyright

!     notice, this list of conditions and the following disclaimer.

!

!   * Redistributions in binary form must reproduce the above

!     copyright notice, this list of conditions and the following

!     disclaimer in the documentation and/or other materials provided

!     with the distribution.

!

!   * Neither the name of the authors nor the names of its

!     contributors may be used to endorse or promote products derived

!     from this software without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

! POSSIBILITY OF SUCH DAMAGE.

!

module adv_dealias

  use advection, only: advection_t
  use num_types, only: rp
  use math, only: vdot3, sub2
  use space, only: space_t, gl
  use field, only: field_t
  use coefs, only: coef_t
  use device_math, only: device_vdot3, device_sub2
  use neko_config, only: neko_bcknd_device, neko_bcknd_sx, neko_bcknd_xsmm, &
    neko_bcknd_opencl, neko_bcknd_cuda, neko_bcknd_hip
  use operators, only: opgrad
  use interpolation, only: interpolator_t
  use device, only: device_map, device_get_ptr, device_free
  use, intrinsic :: iso_c_binding, only: c_ptr, c_null_ptr, c_associated

  implicit none

  private


  !> Type encapsulating advection routines with dealiasing.
  !! The convective term is evaluated on a separate space (`xh_gl`) and the
  !! result is mapped back to the original space (`xh_gll`).
  type, public, extends(advection_t) :: adv_dealias_t
     !> Coefficients on the dealiasing space, set up in `init`.
     type(coef_t) :: coef_gl
     !> Coefficients of the original space. Points at the `coef` handed to
     !! `init`; default-initialised to null so its status is always defined.
     type(coef_t), pointer :: coef_gll => null()
     !> Interpolator between the original and the dealiasing space.
     type(interpolator_t) :: gll_to_gl
     !> Dealiasing space, initialised with the `gl` kind in `init`.
     type(space_t) :: xh_gl
     !> Original space. Points at `coef%Xh` of the `coef` handed to `init`;
     !! default-initialised to null so its status is always defined.
     type(space_t), pointer :: xh_gll => null()
     !> Host work arrays of size nelv * xh_gl%lxyz. They are only allocated
     !! for the HIP, CUDA, OpenCL, SX and XSMM backends.
     real(kind=rp), allocatable :: temp(:), tbf(:)
     !> Host work arrays receiving the velocity mapped to the dealiasing
     !! space.
     real(kind=rp), allocatable :: tx(:), ty(:), tz(:)
     !> Host work arrays receiving the output of `opgrad`.
     real(kind=rp), allocatable :: vr(:), vs(:), vt(:)
     !> Device pointers obtained from `device_map` for the work arrays
     !! above; they stay null unless the device backend is enabled.
     type(c_ptr) :: temp_d = c_null_ptr
     type(c_ptr) :: tbf_d = c_null_ptr
     type(c_ptr) :: tx_d = c_null_ptr
     type(c_ptr) :: ty_d = c_null_ptr
     type(c_ptr) :: tz_d = c_null_ptr
     type(c_ptr) :: vr_d = c_null_ptr
     type(c_ptr) :: vs_d = c_null_ptr
     type(c_ptr) :: vt_d = c_null_ptr

   contains
     !> Add the dealiased advection term for the fluid to the RHS.
     procedure, pass(this) :: compute => compute_advection_dealias
     !> Add the dealiased advection term for a scalar to the RHS.
     procedure, pass(this) :: compute_scalar => compute_scalar_advection_dealias
     !> Constructor.
     procedure, pass(this) :: init => init_dealias
     !> Destructor.
     procedure, pass(this) :: free => free_dealias
  end type adv_dealias_t


contains


  !> Constructor.
  !! Builds the dealiasing space and its coefficients, interpolates the
  !! drdx ... dtdz arrays of `coef` onto that space and, depending on the
  !! backend, allocates and device-maps the work arrays.
  !! @param this The object to initialise.
  !! @param lxd Number of points handed to the dealiasing space in each
  !! of the three directions.
  !! @param coef Coefficients of the original space. `this` keeps pointers
  !! to `coef` and `coef%Xh`, so both must outlive `this`.
  subroutine init_dealias(this, lxd, coef)
    class(adv_dealias_t), target, intent(inout) :: this
    integer, intent(in) :: lxd
    type(coef_t), intent(inout), target :: coef
    integer :: nel, n_GL

    ! Spaces and the interpolator between them
    call this%Xh_GL%init(gl, lxd, lxd, lxd)
    this%Xh_GLL => coef%Xh
    this%coef_GLL => coef
    call this%GLL_to_GL%init(this%Xh_GL, this%Xh_GLL)

    call this%coef_GL%init(this%Xh_GL, coef%msh)

    nel = coef%msh%nelv
    n_GL = nel*this%Xh_GL%lxyz

    ! Overwrite the nine derivative arrays of coef_GL with the ones from
    ! coef, interpolated onto the dealiasing space
    call this%GLL_to_GL%map(this%coef_GL%drdx, coef%drdx, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dsdx, coef%dsdx, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dtdx, coef%dtdx, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%drdy, coef%drdy, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dsdy, coef%dsdy, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dtdy, coef%dtdy, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%drdz, coef%drdz, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dsdz, coef%dsdz, nel, this%Xh_GL)
    call this%GLL_to_GL%map(this%coef_GL%dtdz, coef%dtdz, nel, this%Xh_GL)

    ! Whole-field work arrays are only used by the device and SX/XSMM
    ! paths; the plain CPU path works element by element on local arrays
    if ((neko_bcknd_hip .eq. 1) .or. (neko_bcknd_cuda .eq. 1) .or. &
       (neko_bcknd_opencl .eq. 1) .or. (neko_bcknd_sx .eq. 1) .or. &
       (neko_bcknd_xsmm .eq. 1)) then
       allocate(this%temp(n_GL), this%tbf(n_GL))
       allocate(this%tx(n_GL), this%ty(n_GL), this%tz(n_GL))
       allocate(this%vr(n_GL), this%vs(n_GL), this%vt(n_GL))
    end if

    ! Associate every work array with a device buffer
    if (neko_bcknd_device .eq. 1) then
       call device_map(this%temp, this%temp_d, n_GL)
       call device_map(this%tbf, this%tbf_d, n_GL)
       call device_map(this%tx, this%tx_d, n_GL)
       call device_map(this%ty, this%ty_d, n_GL)
       call device_map(this%tz, this%tz_d, n_GL)
       call device_map(this%vr, this%vr_d, n_GL)
       call device_map(this%vs, this%vs_d, n_GL)
       call device_map(this%vt, this%vt_d, n_GL)
    end if

  end subroutine init_dealias


  !> Destructor.
  !! Releases everything `init` created: the device buffers, the host work
  !! arrays and the dealiasing space with its coefficients and
  !! interpolator. The original space and coefficients are only pointed
  !! to, so they are left untouched and the pointers are nullified.
  !! Safe to call on an object that was never initialised.
  !! @param this The object to tear down.
  subroutine free_dealias(this)
    class(adv_dealias_t), intent(inout) :: this

    ! Device buffers go first, while the host arrays they were mapped
    ! from are still allocated
    call release_device(this%temp_d)
    call release_device(this%tbf_d)
    call release_device(this%tx_d)
    call release_device(this%ty_d)
    call release_device(this%tz_d)
    call release_device(this%vr_d)
    call release_device(this%vs_d)
    call release_device(this%vt_d)

    ! Host work arrays exist only for some backends, hence the guards
    if (allocated(this%temp)) deallocate(this%temp)
    if (allocated(this%tbf)) deallocate(this%tbf)
    if (allocated(this%tx)) deallocate(this%tx)
    if (allocated(this%ty)) deallocate(this%ty)
    if (allocated(this%tz)) deallocate(this%tz)
    if (allocated(this%vr)) deallocate(this%vr)
    if (allocated(this%vs)) deallocate(this%vs)
    if (allocated(this%vt)) deallocate(this%vt)

    ! Components owned by this type
    ! NOTE(review): relies on the `free` bindings of interpolator_t,
    ! coef_t and space_t tolerating uninitialised objects - confirm
    call this%GLL_to_GL%free()
    call this%coef_GL%free()
    call this%Xh_GL%free()

    ! Borrowed from the caller of init; drop the reference only
    nullify(this%coef_GLL)
    nullify(this%Xh_GLL)

  contains

    !> Free one device buffer, if any, and reset its pointer to null.
    subroutine release_device(x_d)
      type(c_ptr), intent(inout) :: x_d

      if (c_associated(x_d)) then
         call device_free(x_d)
         x_d = c_null_ptr
      end if
    end subroutine release_device

  end subroutine free_dealias


  !> Add the advection term for the fluid to the RHS.
  !! The velocity is mapped to the dealiasing space, the convective term
  !! is formed there from `opgrad` of each velocity component, mapped back
  !! to the original space and subtracted from `fx`, `fy` and `fz`.
  !! @param this The dealiased advection object; its work arrays are
  !! overwritten on the device and SX/XSMM paths.
  !! @param vx The x component of the velocity.
  !! @param vy The y component of the velocity.
  !! @param vz The z component of the velocity.
  !! @param fx The x component of the RHS, updated in place.
  !! @param fy The y component of the RHS, updated in place.
  !! @param fz The z component of the RHS, updated in place.
  !! @param Xh Not referenced by this implementation.
  !! @param coef Only `coef%msh%nelv` is read here.
  !! @param n Number of entries of `fx`, `fy`, `fz` updated on the device
  !! and SX/XSMM paths; not referenced on the plain CPU path.
  !! @param dt Not referenced by this implementation.
  subroutine compute_advection_dealias(this, vx, vy, vz, fx, fy, fz, Xh, &
                                       coef, n, dt)
    class(adv_dealias_t), intent(inout) :: this
    type(space_t), intent(in) :: Xh
    type(coef_t), intent(in) :: coef
    type(field_t), intent(inout) :: vx, vy, vz
    type(field_t), intent(inout) :: fx, fy, fz
    integer, intent(in) :: n
    real(kind=rp), intent(in), optional :: dt

    ! Per-element work arrays for the plain CPU path
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: tx, ty, tz
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: tfx, tfy, tfz
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: vr, vs, vt
    real(kind=rp), dimension(this%Xh_GLL%lxyz) :: tempx, tempy, tempz
    integer :: e, nel, n_GL

    nel = coef%msh%nelv
    n_GL = nel * this%Xh_GL%lxyz

    !This is extremely primitive and unoptimized  on the device //Karp
    associate(c_GL => this%coef_GL)
      if (neko_bcknd_device .eq. 1) then

         ! map and opgrad are handed the host arrays, the device_*
         ! routines the device pointers mapped to them in init
         call this%GLL_to_GL%map(this%tx, vx%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%ty, vy%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%tz, vz%x, nel, this%Xh_GL)

         ! x component
         call opgrad(this%vr, this%vs, this%vt, this%tx, c_GL)
         call device_vdot3(this%tbf_d, this%vr_d, this%vs_d, this%vt_d, &
                           this%tx_d, this%ty_d, this%tz_d, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call device_sub2(fx%x_d, this%temp_d, n)

         ! y component
         call opgrad(this%vr, this%vs, this%vt, this%ty, c_GL)
         call device_vdot3(this%tbf_d, this%vr_d, this%vs_d, this%vt_d, &
                           this%tx_d, this%ty_d, this%tz_d, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call device_sub2(fy%x_d, this%temp_d, n)

         ! z component
         call opgrad(this%vr, this%vs, this%vt, this%tz, c_GL)
         call device_vdot3(this%tbf_d, this%vr_d, this%vs_d, this%vt_d, &
                           this%tx_d, this%ty_d, this%tz_d, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call device_sub2(fz%x_d, this%temp_d, n)

      else if ((neko_bcknd_sx .eq. 1) .or. (neko_bcknd_xsmm .eq. 1)) then

         ! Same sequence as above, on whole-field host arrays
         call this%GLL_to_GL%map(this%tx, vx%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%ty, vy%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%tz, vz%x, nel, this%Xh_GL)

         ! x component
         call opgrad(this%vr, this%vs, this%vt, this%tx, c_GL)
         call vdot3(this%tbf, this%vr, this%vs, this%vt, &
                    this%tx, this%ty, this%tz, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call sub2(fx%x, this%temp, n)

         ! y component
         call opgrad(this%vr, this%vs, this%vt, this%ty, c_GL)
         call vdot3(this%tbf, this%vr, this%vs, this%vt, &
                    this%tx, this%ty, this%tz, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call sub2(fy%x, this%temp, n)

         ! z component
         call opgrad(this%vr, this%vs, this%vt, this%tz, c_GL)
         call vdot3(this%tbf, this%vr, this%vs, this%vt, &
                    this%tx, this%ty, this%tz, n_GL)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)
         call sub2(fz%x, this%temp, n)

      else

         ! Plain CPU path: one element at a time on local arrays
         do e = 1, nel
            call this%GLL_to_GL%map(tx, vx%x(1,1,1,e), 1, this%Xh_GL)
            call this%GLL_to_GL%map(ty, vy%x(1,1,1,e), 1, this%Xh_GL)
            call this%GLL_to_GL%map(tz, vz%x(1,1,1,e), 1, this%Xh_GL)

            call opgrad(vr, vs, vt, tx, c_GL, e, e)
            tfx = tx*vr + ty*vs + tz*vt

            call opgrad(vr, vs, vt, ty, c_GL, e, e)
            tfy = tx*vr + ty*vs + tz*vt

            call opgrad(vr, vs, vt, tz, c_GL, e, e)
            tfz = tx*vr + ty*vs + tz*vt

            call this%GLL_to_GL%map(tempx, tfx, 1, this%Xh_GLL)
            call this%GLL_to_GL%map(tempy, tfy, 1, this%Xh_GLL)
            call this%GLL_to_GL%map(tempz, tfz, 1, this%Xh_GLL)

            ! Address element e through its own index instead of a linear
            ! offset in the first subscript, which would run out of bounds.
            ! Assumes an element of fx/fy/fz holds Xh_GLL%lxyz points, as
            ! the maps of vx/vy/vz above already do.
            call sub2(fx%x(1,1,1,e), tempx, this%Xh_GLL%lxyz)
            call sub2(fy%x(1,1,1,e), tempy, this%Xh_GLL%lxyz)
            call sub2(fz%x(1,1,1,e), tempz, this%Xh_GLL%lxyz)
         end do

      end if
    end associate

  end subroutine compute_advection_dealias


  !> Add the advection term for a scalar to the RHS.
  !! The velocity and the scalar are mapped to the dealiasing space, the
  !! velocity is dotted with `opgrad` of the scalar there, and the result
  !! is mapped back to the original space and subtracted from `fs`.
  !! @param this The dealiased advection object; its work arrays are
  !! overwritten on the device and SX/XSMM paths.
  !! @param vx The x component of the advecting velocity.
  !! @param vy The y component of the advecting velocity.
  !! @param vz The z component of the advecting velocity.
  !! @param s The scalar being advected.
  !! @param fs The RHS of the scalar equation, updated in place.
  !! @param Xh Not referenced by this implementation.
  !! @param coef Only `coef%msh%nelv` is read here.
  !! @param n Number of entries of `fs` updated on the device and SX/XSMM
  !! paths; not referenced on the plain CPU path.
  !! @param dt Not referenced by this implementation.
  subroutine compute_scalar_advection_dealias(this, vx, vy, vz, s, fs, Xh, &
                                              coef, n, dt)
    class(adv_dealias_t), intent(inout) :: this
    type(field_t), intent(inout) :: vx, vy, vz
    type(field_t), intent(inout) :: s
    type(field_t), intent(inout) :: fs
    type(space_t), intent(in) :: Xh
    type(coef_t), intent(in) :: coef
    integer, intent(in) :: n
    real(kind=rp), intent(in), optional :: dt

    ! Per-element work arrays for the plain CPU path
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: vx_GL, vy_GL, vz_GL, s_GL
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: dsdx, dsdy, dsdz
    real(kind=rp), dimension(this%Xh_GL%lxyz) :: f_GL
    real(kind=rp), dimension(this%Xh_GLL%lxyz) :: temp
    integer :: e, nel, n_GL

    nel = coef%msh%nelv
    n_GL = nel * this%Xh_GL%lxyz

    associate(c_GL => this%coef_GL)
      if (neko_bcknd_device .eq. 1) then

         ! Map advecting velocity onto the higher-order space
         call this%GLL_to_GL%map(this%tx, vx%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%ty, vy%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%tz, vz%x, nel, this%Xh_GL)

         ! Map the scalar onto the high-order space
         call this%GLL_to_GL%map(this%temp, s%x, nel, this%Xh_GL)

         ! Compute the scalar gradient in the high-order space
         call opgrad(this%vr, this%vs, this%vt, this%temp, c_GL)

         ! Compute the convective term, i.e. dot the velocity with the
         ! scalar gradient
         call device_vdot3(this%tbf_d, this%vr_d, this%vs_d, this%vt_d, &
                           this%tx_d, this%ty_d, this%tz_d, n_GL)

         ! Map back to the original space (we reuse this%temp)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)

         ! Update the source term
         call device_sub2(fs%x_d, this%temp_d, n)

      else if ((neko_bcknd_sx .eq. 1) .or. (neko_bcknd_xsmm .eq. 1)) then

         ! Map advecting velocity onto the higher-order space
         call this%GLL_to_GL%map(this%tx, vx%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%ty, vy%x, nel, this%Xh_GL)
         call this%GLL_to_GL%map(this%tz, vz%x, nel, this%Xh_GL)

         ! Map the scalar onto the high-order space
         call this%GLL_to_GL%map(this%temp, s%x, nel, this%Xh_GL)

         ! Compute the scalar gradient in the high-order space
         call opgrad(this%vr, this%vs, this%vt, this%temp, c_GL)

         ! Compute the convective term, i.e. dot the velocity with the
         ! scalar gradient
         call vdot3(this%tbf, this%vr, this%vs, this%vt, &
                    this%tx, this%ty, this%tz, n_GL)

         ! Map back to the original space (we reuse this%temp)
         call this%GLL_to_GL%map(this%temp, this%tbf, nel, this%Xh_GLL)

         ! Update the source term
         call sub2(fs%x, this%temp, n)

      else

         ! Plain CPU path: one element at a time on local arrays
         do e = 1, nel
            ! Map advecting velocity onto the higher-order space
            call this%GLL_to_GL%map(vx_GL, vx%x(1,1,1,e), 1, this%Xh_GL)
            call this%GLL_to_GL%map(vy_GL, vy%x(1,1,1,e), 1, this%Xh_GL)
            call this%GLL_to_GL%map(vz_GL, vz%x(1,1,1,e), 1, this%Xh_GL)

            ! Map scalar onto the higher-order space
            call this%GLL_to_GL%map(s_GL, s%x(1,1,1,e), 1, this%Xh_GL)

            ! Gradient of s in the higher-order space
            call opgrad(dsdx, dsdy, dsdz, s_GL, c_GL, e, e)

            ! vx * ds/dx + vy * ds/dy + vz * ds/dz for each point in the
            ! element
            f_GL = vx_GL*dsdx + vy_GL*dsdy + vz_GL*dsdz

            ! Map back the constructed operator to the original space
            call this%GLL_to_GL%map(temp, f_GL, 1, this%Xh_GLL)

            ! Address element e through its own index instead of a linear
            ! offset in the first subscript, which would run out of bounds.
            ! Assumes an element of fs holds Xh_GLL%lxyz points, as the
            ! map of s above already does.
            call sub2(fs%x(1,1,1,e), temp, this%Xh_GLL%lxyz)
         end do

      end if
    end associate

  end subroutine compute_scalar_advection_dealias


end module adv_dealias

device::device_get_ptr
Return the device pointer for an associated Fortran array.
Definition device.F90:92

device::device_map
Map a Fortran array to a device (allocate and associate)
Definition device.F90:68

adv_dealias
Subroutines to add advection terms to the RHS of a transport equation.
Definition adv_dealias.f90:34

adv_dealias::init_dealias
subroutine init_dealias(this, lxd, coef)
Constructor.
Definition adv_dealias.f90:103

adv_dealias::compute_scalar_advection_dealias
subroutine compute_scalar_advection_dealias(this, vx, vy, vz, s, fs, xh, coef, n, dt)
Add the advection term for a scalar, i.e. $-u \cdot \nabla s$, to the RHS.
Definition adv_dealias.f90:293

adv_dealias::free_dealias
subroutine free_dealias(this)
Destructor.
Definition adv_dealias.f90:155

adv_dealias::compute_advection_dealias
subroutine compute_advection_dealias(this, vx, vy, vz, fx, fy, fz, xh, coef, n, dt)
Add the advection term for the fluid, i.e. $-(u \cdot \nabla) u$, to the RHS.
Definition adv_dealias.f90:173

advection
Subroutines to add advection terms to the RHS of a transport equation.
Definition advection.f90:34

coefs
Coefficients.
Definition coef.f90:34

device_math
Definition device_math.F90:33

device_math::device_vdot3
subroutine, public device_vdot3(dot_d, u1_d, u2_d, u3_d, v1_d, v2_d, v3_d, n)
Compute a dot product $u \cdot v$ (3-d version) assuming vector components $u = (u_1, u_2, u_3)$ etc.
Definition device_math.F90:491

device_math::device_sub2
subroutine, public device_sub2(a_d, b_d, n)
Vector subtraction $a = a - b$.
Definition device_math.F90:430

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

field
Defines a field.
Definition field.f90:34

interpolation
Routines to interpolate between different spaces.
Definition interpolation.f90:34

math
Definition math.f90:60

math::vdot3
subroutine, public vdot3(dot, u1, u2, u3, v1, v2, v3, n)
Compute a dot product $u \cdot v$ (3-d version) assuming vector components $u = (u_1, u_2, u_3)$ etc.
Definition math.f90:544

math::sub2
subroutine, public sub2(a, b, n)
Vector subtraction $a = a - b$.
Definition math.f90:628

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_sx
integer, parameter neko_bcknd_sx
Definition neko_config.f90:39

neko_config::neko_bcknd_hip
integer, parameter neko_bcknd_hip
Definition neko_config.f90:42

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

neko_config::neko_bcknd_opencl
integer, parameter neko_bcknd_opencl
Definition neko_config.f90:43

neko_config::neko_bcknd_cuda
integer, parameter neko_bcknd_cuda
Definition neko_config.f90:41

neko_config::neko_bcknd_xsmm
integer, parameter neko_bcknd_xsmm
Definition neko_config.f90:40

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

operators
Operators.
Definition operators.f90:34

operators::opgrad
subroutine, public opgrad(ux, uy, uz, u, coef, es, ee)
Compute the weak gradient of a scalar field, i.e. the gradient multiplied by the mass matrix.
Definition operators.f90:173

space
Defines a function space.
Definition space.f90:34

space::gl
integer, parameter, public gl
Definition space.f90:48

adv_dealias::adv_dealias_t
Type encapsulating advection routines with dealiasing.
Definition adv_dealias.f90:52

advection::advection_t
Base abstract type for computing the advection operator.
Definition advection.f90:46

coefs::coef_t
Coefficients defined on a given (mesh, $X_h$) tuple. Arrays use indices (i,j,k,e): element e,...
Definition coef.f90:55

field::field_t
Definition field.f90:47

interpolation::interpolator_t
Interpolation between two space::space_t.
Definition interpolation.f90:53

space::space_t
The function space for the SEM solution fields.
Definition space.f90:62