db/da5/gradient__jump__penalty_8f90_source.html

! Copyright (c) 2024, The Neko Authors

! All rights reserved.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

!   * Redistributions of source code must retain the above copyright

!     notice, this list of conditions and the following disclaimer.

!

!   * Redistributions in binary form must reproduce the above

!     copyright notice, this list of conditions and the following

!     disclaimer in the documentation and/or other materials provided

!     with the distribution.

!

!   * Neither the name of the authors nor the names of its

!     contributors may be used to endorse or promote products derived

!     from this software without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

! POSSIBILITY OF SUCH DAMAGE.

!

!

module gradient_jump_penalty

  use num_types, only : rp

  use utils, only : neko_error

  use json_utils, only : json_get_or_default

  use json_module, only : json_file

  use math

  use point, only : point_t

  use field, only : field_t

  use dofmap , only : dofmap_t

  use neko_config, only : neko_bcknd_device

  use coefs, only : coef_t

  use element, only : element_t

  use hex

  use quad

  use operators, only : dudxyz

  use gs_ops, only : gs_op_add

  use space

  use gather_scatter, only : gs_t

  use device

  use device_math

  use device_gradient_jump_penalty


  implicit none

  private


  type, public :: gradient_jump_penalty_t

     real(kind=rp) :: tau

     integer :: p

     integer :: lx

     real(kind=rp), allocatable, dimension(:, :, :, :) :: penalty

     type(c_ptr) :: penalty_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: penalty_facet

     type(c_ptr) :: penalty_facet_d = c_null_ptr

     type(coef_t), pointer :: coef => null()

     type(dofmap_t), pointer :: dm => null()


     real(kind=rp), allocatable, dimension(:, :, :, :) :: grad1, &

                                                          grad2, grad3

     real(kind=rp), allocatable, dimension(:, :, :, :) :: grad1, & …

     type(c_ptr) :: grad1_d = c_null_ptr

     type(c_ptr) :: grad2_d = c_null_ptr

     type(c_ptr) :: grad3_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: g

     type(c_ptr) :: g_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: flux1, flux2, flux3

     type(c_ptr) :: flux1_d = c_null_ptr

     type(c_ptr) :: flux2_d = c_null_ptr

     type(c_ptr) :: flux3_d = c_null_ptr


     real(kind=rp), allocatable, dimension(:, :, :, :) :: volflux1, &

                                                          volflux2, volflux3

     real(kind=rp), allocatable, dimension(:, :, :, :) :: volflux1, & …

     type(c_ptr) :: volflux1_d = c_null_ptr

     type(c_ptr) :: volflux2_d = c_null_ptr

     type(c_ptr) :: volflux3_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: absvolflux

     type(c_ptr) :: absvolflux_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: n1, n2, n3

     type(c_ptr) :: n1_d = c_null_ptr

     type(c_ptr) :: n2_d = c_null_ptr

     type(c_ptr) :: n3_d = c_null_ptr

     real(kind=rp), allocatable, dimension(:, :, :, :) :: facet_factor

     type(c_ptr) :: facet_factor_d = c_null_ptr

     integer, allocatable :: n_facet(:)

     integer :: n_facet_max

     real(kind=rp), allocatable, dimension(:, :, :, :) :: h2

     real(kind=rp), allocatable :: dphidxi(:, :)

     type(c_ptr) :: dphidxi_d = c_null_ptr

     type(space_t) :: xh_gjp

     type(dofmap_t) :: dm_gjp

     type(gs_t) :: gs_gjp

     integer :: n

     integer :: n_large


  contains

     procedure, pass(this) :: init => gradient_jump_penalty_init

     procedure, pass(this) :: free => gradient_jump_penalty_free

     procedure, pass(this) :: compute => gradient_jump_penalty_compute

     procedure, pass(this) :: perform => gradient_jump_penalty_perform


  end type gradient_jump_penalty_t

  type, public :: gradient_jump_penalty_t …


contains


  subroutine gradient_jump_penalty_init(this, params, dofmap, coef, a, b)

    implicit none

    class(gradient_jump_penalty_t), intent(inout) :: this

    type(json_file), target, intent(inout) :: params

    type(dofmap_t), target, intent(in) :: dofmap

    type(coef_t), target, intent(in) :: coef

    real(kind=rp), intent(in) :: a, b


    integer :: i, j, k, l

    real(kind=rp), allocatable :: zg(:) ! Quadrature points

    real(kind=rp) :: normal(3)


    call this%free()


    this%dm => dofmap

    this%p = dofmap%xh%lx - 1

    this%lx = dofmap%xh%lx


    if (this%p .gt. 1) then

       this%tau = -a * (this%p + 1) ** (-b)

    else

       this%tau = -a

    end if


    this%coef => coef

    this%n = this%lx ** 3 * this%coef%msh%nelv

    this%n_large = (this%lx + 2) ** 3 * this%coef%msh%nelv


    allocate(this%n_facet(this%coef%msh%nelv))

    do i = 1, this%coef%msh%nelv

       select type (ep  => this%coef%msh%elements(i)%e)

       type is (hex_t)

          this%n_facet(i) = 6

       type is (quad_t)

          call neko_error("Only Hexahedral element is &

                           &supported now for gradient jump penalty")

       end select

    end do

    this%n_facet_max = maxval(this%n_facet)


    allocate(this%h2(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))


    do i = 1, this%coef%msh%nelv

       select type (ep => this%coef%msh%elements(i)%e)

       type is (hex_t)

          call eval_h2_hex(this%h2(:, :, :, i), this%lx, i, this%dm, this%coef)

       type is (quad_t)

          call neko_error("Gradient jump penalty error: mesh size &

                            &evaluation is not supported for quad_t")

       end select

    end do


    allocate(zg(this%lx))

    allocate(this%dphidxi(this%lx, this%lx))


    zg = dofmap%xh%zg(:,1)

    do i = 1, dofmap%xh%lx

       do j = 1, dofmap%xh%lx

          this%dphidxi(j,i) = this%coef%Xh%dx(j,i)

       end do

    end do


    allocate(this%penalty(this%lx, this%lx, this%lx, this%coef%msh%nelv))

    allocate(this%grad1(this%lx, this%lx, this%lx, this%coef%msh%nelv))

    allocate(this%grad2(this%lx, this%lx, this%lx, this%coef%msh%nelv))

    allocate(this%grad3(this%lx, this%lx, this%lx, this%coef%msh%nelv))


    allocate(this%penalty_facet(this%lx + 2, this%lx + 2, &

                    this%lx + 2, this%coef%msh%nelv))

    allocate(this%G(this%lx + 2, this%lx + 2, &

                    this%lx + 2, this%coef%msh%nelv))

    allocate(this%flux1(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%flux2(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%flux3(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%volflux1(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%volflux2(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%volflux3(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%absvolflux(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%n1(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%n2(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))

    allocate(this%n3(this%lx + 2, this%lx + 2, &

                        this%lx + 2, this%coef%msh%nelv))


    ! Extract facets' normals

    do i = 1, this%coef%msh%nelv

       do j = 1, 6 ! for hexahedral elements

          do k = 1, this%lx

             do l = 1, this%lx

                select case(j)

                case(1)

                   normal = this%coef%get_normal(1, l, k, i, j)

                   this%n1(1, l + 1, k + 1, i) = normal(1)

                   this%n2(1, l + 1, k + 1, i) = normal(2)

                   this%n3(1, l + 1, k + 1, i) = normal(3)

                case(2)

                   normal = this%coef%get_normal(1, l, k, i, j)

                   this%n1(this%lx + 2, l + 1, k + 1, i) = normal(1)

                   this%n2(this%lx + 2, l + 1, k + 1, i) = normal(2)

                   this%n3(this%lx + 2, l + 1, k + 1, i) = normal(3)

                case(3)

                   normal = this%coef%get_normal(l, 1, k, i, j)

                   this%n1(l + 1, 1, k + 1, i) = normal(1)

                   this%n2(l + 1, 1, k + 1, i) = normal(2)

                   this%n3(l + 1, 1, k + 1, i) = normal(3)

                case(4)

                   normal = this%coef%get_normal(l, 1, k, i, j)

                   this%n1(l + 1, this%lx + 2, k + 1, i) = normal(1)

                   this%n2(l + 1, this%lx + 2, k + 1, i) = normal(2)

                   this%n3(l + 1, this%lx + 2, k + 1, i) = normal(3)

                case(5)

                   normal = this%coef%get_normal(l, k, 1, i, j)

                   this%n1(l + 1, k + 1, 1, i) = normal(1)

                   this%n2(l + 1, k + 1, 1, i) = normal(2)

                   this%n3(l + 1, k + 1, 1, i) = normal(3)

                case(6)

                   normal = this%coef%get_normal(l, k, 1, i, j)

                   this%n1(l + 1, k + 1, this%lx + 2, i) = normal(1)

                   this%n2(l + 1, k + 1, this%lx + 2, i) = normal(2)

                   this%n3(l + 1, k + 1, this%lx + 2, i) = normal(3)

                case default

                   call neko_error("The face index is not correct")

                end select

             end do

          end do

       end do

    end do


    ! Assemble facet factor

    call facet_factor_init(this)


    ! Initialize Gather-Scatter

    call this%Xh_GJP%init(gll, this%lx+2, this%lx+2, this%lx+2)

    call this%dm_GJP%init(this%coef%msh, this%Xh_GJP)

    call this%gs_GJP%init(this%dm_GJP)


    ! Initialize pointers for device

    if (neko_bcknd_device .eq. 1) then

       call device_map(this%dphidxi, this%dphidxi_d, &

                       this%lx * this%lx)

       call device_map(this%penalty, this%penalty_d, this%n)

       call device_map(this%grad1, this%grad1_d, this%n)

       call device_map(this%grad2, this%grad2_d, this%n)

       call device_map(this%grad3, this%grad3_d, this%n)


       call device_map(this%penalty_facet, this%penalty_facet_d, this%n_large)

       call device_map(this%G, this%G_d, this%n_large)

       call device_map(this%flux1, this%flux1_d, this%n_large)

       call device_map(this%flux2, this%flux2_d, this%n_large)

       call device_map(this%flux3, this%flux3_d, this%n_large)


       call device_map(this%volflux1, this%volflux1_d, this%n_large)

       call device_map(this%volflux2, this%volflux2_d, this%n_large)

       call device_map(this%volflux3, this%volflux3_d, this%n_large)

       call device_map(this%absvolflux, this%absvolflux_d, this%n_large)


       call device_map(this%n1, this%n1_d, this%n_large)

       call device_map(this%n2, this%n2_d, this%n_large)

       call device_map(this%n3, this%n3_d, this%n_large)

       call device_map(this%facet_factor, this%facet_factor_d, this%n_large)


       call device_memcpy(this%dphidxi, this%dphidxi_d, &

                       this%lx * this%lx, &

                       host_to_device, sync = .false.)

       call device_memcpy(this%n1, this%n1_d, this%n_large, &

                          host_to_device, sync = .false.)

       call device_memcpy(this%n2, this%n2_d, this%n_large, &

                          host_to_device, sync = .false.)

       call device_memcpy(this%n3, this%n3_d, this%n_large, &

                          host_to_device, sync = .false.)

       call device_memcpy(this%facet_factor, this%facet_factor_d, this%n_large,&

                          host_to_device, sync = .false.)


    end if


  subroutine gradient_jump_penalty_init(this, params, dofmap, coef, a, b) …

  end subroutine gradient_jump_penalty_init


  subroutine eval_h2_hex(h2_el, n, i, dm, coef)

    integer, intent(in) :: n, i

    type(dofmap_t), pointer, intent(in) :: dm

    type(coef_t), pointer, intent(in) :: coef

    real(kind=rp), intent(inout) :: h2_el(n + 2, n + 2, n + 2)


    integer :: j, k, l


    h2_el = 0.0_rp


    do j = 1, 6

       do k = 1, n

          do l = 1, n

             select case(j)

             case(1)

                h2_el(1, l + 1, k + 1) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case(2)

                h2_el(n + 2, l + 1, k + 1) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case(3)

                h2_el(l + 1, 1, k + 1) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case(4)

                h2_el(l + 1, n + 2, k + 1) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case(5)

                h2_el(l + 1, k + 1, 1) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case(6)

                h2_el(l + 1, k + 1, n + 2) = &

                  dist2_quadrature_hex(l, k, j, i, n, dm, coef)

             case default

                call neko_error("The face index is not correct")

             end select

          end do

       end do

    end do


  subroutine eval_h2_hex(h2_el, n, i, dm, coef) …

  end subroutine eval_h2_hex


  function dist2_quadrature_hex(l, k, j, i, n, dm, coef) result(dist2)

    integer, intent(in) :: l, k, j, i, n

    type(dofmap_t), pointer, intent(in) :: dm

    type(coef_t), pointer, intent(in) :: coef

    real(kind=rp) :: dist2, dist_1, dist_2


    real(kind=rp) :: x1, y1, z1, x2, y2, z2

    real(kind=rp) :: normal1(3), normal2(3)

    real(kind=rp) :: n11, n12, n13, n21, n22, n23

    real(kind=rp) :: v1, v2, v3


    dist2 = 0.0_rp

    select case(j)

    case(1)

       normal1 = coef%get_normal(1, l, k, i, 1)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(1, l, k, i)

       y1 = dm%y(1, l, k, i)

       z1 = dm%z(1, l, k, i)

       normal2 = coef%get_normal(1, l, k, i, 2)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(n, l, k, i)

       y2 = dm%y(n, l, k, i)

       z2 = dm%z(n, l, k, i)

    case(2)

       ! now the facet pair share the same value for h

       ! but just let it be here for furture possible changes

       normal1 = coef%get_normal(1, l, k, i, 2)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(n, l, k, i)

       y1 = dm%y(n, l, k, i)

       z1 = dm%z(n, l, k, i)

       normal2 = coef%get_normal(1, l, k, i, 1)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(1, l, k, i)

       y2 = dm%y(1, l, k, i)

       z2 = dm%z(1, l, k, i)

    case(3)

       normal1 = coef%get_normal(1, l, k, i, 3)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(l, 1, k, i)

       y1 = dm%y(l, 1, k, i)

       z1 = dm%z(l, 1, k, i)

       normal2 = coef%get_normal(1, l, k, i, 4)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(l, n, k, i)

       y2 = dm%y(l, n, k, i)

       z2 = dm%z(l, n, k, i)

    case(4)

       normal1 = coef%get_normal(1, l, k, i, 4)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(l, n, k, i)

       y1 = dm%y(l, n, k, i)

       z1 = dm%z(l, n, k, i)

       normal2 = coef%get_normal(1, l, k, i, 3)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(l, 1, k, i)

       y2 = dm%y(l, 1, k, i)

       z2 = dm%z(l, 1, k, i)

    case(5)

       normal1 = coef%get_normal(1, l, k, i, 5)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(l, k, 1, i)

       y1 = dm%y(l, k, 1, i)

       z1 = dm%z(l, k, 1, i)

       normal2 = coef%get_normal(1, l, k, i, 6)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(l, k, n, i)

       y2 = dm%y(l, k, n, i)

       z2 = dm%z(l, k, n, i)

    case(6)

       normal1 = coef%get_normal(1, l, k, i, 6)

       n11 = normal1(1)

       n12 = normal1(2)

       n13 = normal1(3)

       x1 = dm%x(l, k, n, i)

       y1 = dm%y(l, k, n, i)

       z1 = dm%z(l, k, n, i)

       normal2 = coef%get_normal(1, l, k, i, 5)

       n21 = normal2(1)

       n22 = normal2(2)

       n23 = normal2(3)

       x2 = dm%x(l, k, 1, i)

       y2 = dm%y(l, k, 1, i)

       z2 = dm%z(l, k, 1, i)

    case default

       call neko_error("The face index is not correct")

    end select


    ! get the vector from the quadrature point to the one on the other side

    v1 = x2 - x1

    v2 = y2 - y1

    v3 = z2 - z1

    ! Project onto tabsvolflhe facet-normal direction of the point

    dist_1 = v1*n11 + v2*n12 + v3*n13

    dist_2 = - (v1*n21 + v2*n22 + v3*n23)


    dist2 = ((dist_1 + dist_2)/2.0_rp)*((dist_1 + dist_2)/2.0_rp)


  function dist2_quadrature_hex(l, k, j, i, n, dm, coef) result(dist2) …

  end function


  subroutine facet_factor_init(this)

    class(gradient_jump_penalty_t), intent(inout) :: this

    integer :: i, j, k, l

    real(kind=rp) :: area_tmp


    allocate(this%facet_factor(this%lx + 2, this%lx + 2, &

                               this%lx + 2, this%coef%msh%nelv))


    associate(facet_factor => this%facet_factor, &

              coef => this%coef, &

              lx => this%lx, &

              nelv => this%coef%msh%nelv, &

              jacinv => this%coef%jacinv, h2 => this%h2, &

              tau => this%tau, n1 => this%n1, &

              n2 => this%n2, n3 => this%n3)


    do i = 1, nelv

       do j = 1, 6 ! for hexahedral elementsh2

          do k = 1, lx

             do l = 1, lx

                select case(j)

                case(1)

                   area_tmp = coef%get_area(1, l, k, i, j)

                   facet_factor(1, l + 1, k + 1, i) = area_tmp * tau * &

                           h2(1, l + 1, k + 1, i) * &

                           (n1(1, l + 1, k + 1, i) * coef%drdx(1, l, k, i) + &

                            n2(1, l + 1, k + 1, i) * coef%drdy(1, l, k, i) + &

                            n3(1, l + 1, k + 1, i) * coef%drdz(1, l, k, i) ) &

                           * jacinv(1, l, k, i)

                case(2)

                   area_tmp = coef%get_area(1, l, k, i, j)

                   facet_factor(lx + 2, l + 1, k + 1, i) = area_tmp * tau * &

                           h2(lx + 2, l + 1, k + 1, i) * &

                           (n1(lx + 2, l + 1, k + 1, i) * &

                            coef%drdx(lx, l, k, i) + &

                            n2(lx + 2, l + 1, k + 1, i) * &

                            coef%drdy(lx, l, k, i) + &

                            n3(lx + 2, l + 1, k + 1, i) * &

                            coef%drdz(lx, l, k, i) ) &

                           * jacinv(lx, l, k, i)

                case(3)

                   area_tmp = coef%get_area(l, 1, k, i, j)

                   facet_factor(l + 1, 1, k + 1, i) = area_tmp * tau * &

                           h2(l + 1, 1, k + 1, i) * &

                           (n1(l + 1, 1, k + 1, i) * coef%dsdx(l, 1, k, i) + &

                            n2(l + 1, 1, k + 1, i) * coef%dsdy(l, 1, k, i) + &

                            n3(l + 1, 1, k + 1, i) * coef%dsdz(l, 1, k, i) ) &

                           * jacinv(l, 1, k, i)

                case(4)

                   area_tmp = coef%get_area(l, 1, k, i, j)

                   facet_factor(l + 1, lx + 2, k + 1, i) = area_tmp * tau * &

                           h2(l + 1, lx + 2, k + 1, i) * &

                           (n1(l + 1, lx + 2, k + 1, i) * &

                            coef%dsdx(l, lx, k, i) + &

                            n2(l + 1, lx + 2, k + 1, i) * &

                            coef%dsdy(l, lx, k, i) + &

                            n3(l + 1, lx + 2, k + 1, i) * &

                            coef%dsdz(l, lx, k, i) ) &

                           * jacinv(l, lx, k, i)

                case(5)

                   area_tmp = coef%get_area(l, k, 1, i, j)

                   facet_factor(l + 1, k + 1, 1, i) = area_tmp * tau * &

                           h2(l + 1, k + 1, 1, i) * &

                           (n1(l + 1, k + 1, 1, i) * coef%dtdx(l, k, 1, i) + &

                            n2(l + 1, k + 1, 1, i) * coef%dtdy(l, k, 1, i) + &

                            n3(l + 1, k + 1, 1, i) * coef%dtdz(l, k, 1, i) ) &

                           * jacinv(l, k, 1, i)

                case(6)

                   area_tmp = coef%get_area(l, k, 1, i, j)

                   facet_factor(l + 1, k + 1, lx + 2, i) = area_tmp * tau * &

                           h2(l + 1, k + 1, lx + 2, i) * &

                           (n1(l + 1, k + 1, lx + 2, i) * coef%dtdx(l, k, lx, i) + &

                            n2(l + 1, k + 1, lx + 2, i) * coef%dtdy(l, k, lx, i) + &

                            n3(l + 1, k + 1, lx + 2, i) * coef%dtdz(l, k, lx, i) ) &

                           * jacinv(l, k, lx, i)

                case default

                   call neko_error("The face index is not correct")

                end select

             end do

          end do

       end do

    end do


    end associate

  subroutine facet_factor_init(this) …

  end subroutine facet_factor_init


  subroutine gradient_jump_penalty_free(this)

    implicit none

    class(gradient_jump_penalty_t), intent(inout) :: this


    if (c_associated(this%dphidxi_d)) then

       call device_free(this%dphidxi_d)

    end if

    if (c_associated(this%penalty_d)) then

       call device_free(this%penalty_d)

    end if

    if (c_associated(this%grad1_d)) then

       call device_free(this%grad1_d)

    end if

    if (c_associated(this%grad2_d)) then

       call device_free(this%grad2_d)

    end if

    if (c_associated(this%grad3_d)) then

       call device_free(this%grad3_d)

    end if

    if (c_associated(this%penalty_facet_d)) then

       call device_free(this%penalty_facet_d)

    end if

    if (c_associated(this%G_d)) then

       call device_free(this%G_d)

    end if

    if (c_associated(this%flux1_d)) then

       call device_free(this%flux1_d)

    end if

    if (c_associated(this%flux2_d)) then

       call device_free(this%flux2_d)

    end if

    if (c_associated(this%flux3_d)) then

       call device_free(this%flux3_d)

    end if

    if (c_associated(this%volflux1_d)) then

       call device_free(this%volflux1_d)

    end if

    if (c_associated(this%volflux2_d)) then

       call device_free(this%volflux2_d)

    end if

    if (c_associated(this%volflux3_d)) then

       call device_free(this%volflux3_d)

    end if

    if (c_associated(this%absvolflux_d)) then

       call device_free(this%absvolflux_d)

    end if

    if (c_associated(this%n1_d)) then

       call device_free(this%n1_d)

    end if

    if (c_associated(this%n2_d)) then

       call device_free(this%n2_d)

    end if

    if (c_associated(this%n3_d)) then

       call device_free(this%n3_d)

    end if

    if (c_associated(this%facet_factor_d)) then

       call device_free(this%facet_factor_d)

    end if


    if (allocated(this%penalty)) then

       deallocate(this%penalty)

    end if

    if (allocated(this%grad1)) then

       deallocate(this%grad1)

    end if

    if (allocated(this%grad2)) then

       deallocate(this%grad2)

    end if

    if (allocated(this%grad3)) then

       deallocate(this%grad3)

    end if

    if (allocated(this%h2)) then

       deallocate(this%h2)

    end if

    if (allocated(this%n_facet)) then

       deallocate(this%n_facet)

    end if

    if (allocated(this%dphidxi)) then

       deallocate(this%dphidxi)

    end if

    if (allocated(this%penalty_facet)) then

       deallocate(this%penalty_facet)

    end if

    if (allocated(this%G)) then

       deallocate(this%G)

    end if

    if (allocated(this%flux1)) then

       deallocate(this%flux1)

    end if

    if (allocated(this%flux2)) then

       deallocate(this%flux2)

    end if

    if (allocated(this%flux3)) then

       deallocate(this%flux3)

    end if

     if (allocated(this%volflux1)) then

       deallocate(this%volflux1)

    end if

    if (allocated(this%volflux2)) then

       deallocate(this%volflux2)

    end if

    if (allocated(this%volflux3)) then

       deallocate(this%volflux3)

    end if

    if (allocated(this%absvolflux)) then

       deallocate(this%absvolflux)

    end if

    if (allocated(this%n1)) then

       deallocate(this%n1)

    end if

    if (allocated(this%n2)) then

       deallocate(this%n2)

    end if

    if (allocated(this%n3)) then

       deallocate(this%n3)

    end if

    if (allocated(this%facet_factor)) then

       deallocate(this%facet_factor)

    end if


    nullify(this%coef)

    nullify(this%dm)


    call this%Xh_GJP%free()

    call this%gs_GJP%free()


  subroutine gradient_jump_penalty_free(this) …

  end subroutine gradient_jump_penalty_free


  subroutine gradient_jump_penalty_compute(this, u, v, w, s)

    class(gradient_jump_penalty_t), intent(inout) :: this

    type(field_t), intent(in) :: u, v, w, s


    class(element_t), pointer :: ep

    integer :: i


    call g_compute(this, s)

    call absvolflux_compute(this, u, v, w)


    if (neko_bcknd_device .eq. 1) then

       call device_col3(this%penalty_facet_d, this%absvolflux_d, this%G_d, &

                        this%n_large)

       call device_col2(this%penalty_facet_d, this%facet_factor_d, this%n_large)

       call device_gradient_jump_penalty_finalize(this%penalty_d, &

                                           this%penalty_facet_d, &

                                           this%dphidxi_d, &

                                           this%lx, this%coef%msh%nelv)

    else

       call col3(this%penalty_facet, this%absvolflux, this%G, this%n_large)

       call col2(this%penalty_facet, this%facet_factor, this%n_large)

       call gradient_jump_penalty_finalize(this%penalty, this%penalty_facet, &

                                           this%dphidxi, &

                                           this%lx, this%coef%msh%nelv)

    end if


  subroutine gradient_jump_penalty_compute(this, u, v, w, s) …

  end subroutine gradient_jump_penalty_compute


  subroutine gradient_jump_penalty_perform(this, f)

    class(gradient_jump_penalty_t), intent(inout) :: this

    type(field_t), intent(inout) :: f


    integer :: i, j, k, l


    if (neko_bcknd_device .eq. 1) then

       call device_add2(f%x_d, this%penalty_d, this%coef%dof%size())

    else

       call add2(f%x, this%penalty, this%coef%dof%size())

    end if


  subroutine gradient_jump_penalty_perform(this, f) …

  end subroutine gradient_jump_penalty_perform


  subroutine gradient_jump_penalty_finalize(penalty, wa, dphidxi, lx, nelv)

    integer, intent(in) :: lx, nelv

    real(kind=rp), intent(inout) :: penalty(lx, lx, lx, nelv)

    real(kind=rp), intent(in) :: wa(lx + 2, lx + 2, lx + 2, nelv)

    real(kind=rp), intent(in) :: dphidxi(lx, lx)


    call gradient_jump_penalty_finalize_hex(penalty, wa, dphidxi, lx, nelv)


  subroutine gradient_jump_penalty_finalize(penalty, wa, dphidxi, lx, nelv) …

  end subroutine gradient_jump_penalty_finalize


  subroutine gradient_jump_penalty_finalize_hex(penalty, wa, dphidxi, lx, nelv)

    integer, intent(in) :: lx, nelv

    real(kind=rp), intent(inout) :: penalty(lx, lx, lx, nelv)

    real(kind=rp), intent(in) :: wa(lx + 2, lx + 2, lx + 2, nelv)

    real(kind=rp), intent(in) :: dphidxi(lx, lx)


    integer :: i, j, k


    do i = 1, lx

       do j = 1, lx

          do k = 1, lx

             penalty(i, j, k, :) = &

               wa(1, j + 1, k + 1, :) * &

                  dphidxi(1, i) + &

               wa(lx + 2, j + 1, k + 1, :) * &

                  dphidxi(lx, i) + &

               wa(i + 1, 1, k + 1, :) * &

                  dphidxi(1, j) + &

               wa(i + 1, lx + 2, k + 1, :) * &

                  dphidxi(lx, j) + &

               wa(i + 1, j + 1, 1, :) * &

                  dphidxi(1, k) + &

               wa(i + 1, j + 1, lx + 2, :) * &

                  dphidxi(lx, k)

          end do

       end do

    end do


  subroutine gradient_jump_penalty_finalize_hex(penalty, wa, dphidxi, lx, nelv) …

  end subroutine gradient_jump_penalty_finalize_hex


  subroutine g_compute(this, s)

    class(gradient_jump_penalty_t), intent(inout) :: this

    type(field_t), intent(in) :: s


    call dudxyz(this%grad1, s%x, this%coef%drdx, &

                this%coef%dsdx, this%coef%dtdx, this%coef)

    call dudxyz(this%grad2, s%x, this%coef%drdy, &

                this%coef%dsdy, this%coef%dtdy, this%coef)

    call dudxyz(this%grad3, s%x, this%coef%drdz, &

                this%coef%dsdz, this%coef%dtdz, this%coef)


    if (neko_bcknd_device .eq. 1) then

       call device_pick_facet_value_hex(this%flux1_d, this%grad1_d, &

                                 this%lx, this%coef%msh%nelv)

       call device_pick_facet_value_hex(this%flux2_d, this%grad2_d, &

                                 this%lx, this%coef%msh%nelv)

       call device_pick_facet_value_hex(this%flux3_d, this%grad3_d, &

                                 this%lx, this%coef%msh%nelv)

       call device_col2(this%flux1_d, this%n1_d, this%n_large)

       call device_col2(this%flux2_d, this%n2_d, this%n_large)

       call device_col2(this%flux3_d, this%n3_d, this%n_large)

       call device_add3s2(this%G_d, this%flux1_d, this%flux2_d, &

                          1.0_rp, 1.0_rp, this%n_large)

       call device_add2(this%G_d, this%flux3_d, this%n_large)

    else

       call pick_facet_value_hex(this%flux1, this%grad1, &

                                 this%lx, this%coef%msh%nelv)

       call pick_facet_value_hex(this%flux2, this%grad2, &

                                 this%lx, this%coef%msh%nelv)

       call pick_facet_value_hex(this%flux3, this%grad3, &

                                 this%lx, this%coef%msh%nelv)

       call col2(this%flux1, this%n1, this%n_large)

       call col2(this%flux2, this%n2, this%n_large)

       call col2(this%flux3, this%n3, this%n_large)

       call add3(this%G, this%flux1, this%flux2, this%n_large)

       call add2(this%G, this%flux3, this%n_large)

    end if


    call this%gs_GJP%op(this%G, this%n_large, gs_op_add)


  subroutine g_compute(this, s) …

  end subroutine g_compute


  subroutine absvolflux_compute(this, u, v, w)

    class(gradient_jump_penalty_t), intent(inout) :: this

    type(field_t), intent(in) :: u, v, w


    integer :: i


    if (neko_bcknd_device .eq. 1) then

       call device_pick_facet_value_hex(this%volflux1_d, u%x_d, this%lx, &

                                        this%coef%msh%nelv)

       call device_pick_facet_value_hex(this%volflux2_d, v%x_d, this%lx, &

                                        this%coef%msh%nelv)

       call device_pick_facet_value_hex(this%volflux3_d, w%x_d, this%lx, &

                                        this%coef%msh%nelv)

       call device_col2(this%volflux1_d, this%n1_d, this%n_large)

       call device_col2(this%volflux2_d, this%n2_d, this%n_large)

       call device_col2(this%volflux3_d, this%n3_d, this%n_large)

       call device_add3s2(this%absvolflux_d, this%volflux1_d, &

                          this%volflux2_d, 1.0_rp, 1.0_rp, this%n_large)

       call device_add2(this%absvolflux_d, this%volflux3_d, this%n_large)

       call device_absval(this%absvolflux_d, this%n_large)

    else

       call pick_facet_value_hex(this%volflux1, u%x, &

                                 this%lx, this%coef%msh%nelv)

       call pick_facet_value_hex(this%volflux2, v%x, &

                                 this%lx, this%coef%msh%nelv)

       call pick_facet_value_hex(this%volflux3, w%x, &

                                 this%lx, this%coef%msh%nelv)

       call col2(this%volflux1, this%n1, this%n_large)

       call col2(this%volflux2, this%n2, this%n_large)

       call col2(this%volflux3, this%n3, this%n_large)

       call add3(this%absvolflux, this%volflux1, this%volflux2, this%n_large)

       call add2(this%absvolflux, this%volflux3, this%n_large)

       call absval(this%absvolflux, this%n_large)

    end if


  subroutine absvolflux_compute(this, u, v, w) …

  end subroutine absvolflux_compute


  subroutine pick_facet_value_hex(f_facet, f_field, lx, nelv)

    integer, intent(in) :: lx, nelv

    real(kind=rp), intent(in) :: f_field(lx, lx, lx, nelv)

    real(kind=rp), intent(inout) :: f_facet(lx + 2, lx + 2, lx + 2, nelv)


    call copy(f_facet(1, 2: lx + 1, 2: lx + 1, :), &

              f_field(1, :, :, :), lx * lx * nelv)

    call copy(f_facet(lx + 2, 2: lx + 1, 2: lx + 1, :), &

              f_field(lx, :, :, :), lx * lx * nelv)

    call copy(f_facet(2: lx + 1, 1, 2: lx + 1, :), &

              f_field(:, 1, :, :), lx * lx * nelv)

    call copy(f_facet(2: lx + 1, lx + 2, 2: lx + 1, :), &

              f_field(:, lx, :, :), lx * lx * nelv)

    call copy(f_facet(2: lx + 1, 2: lx + 1, 1, :), &

              f_field(:, :, 1, :), lx * lx * nelv)

    call copy(f_facet(2: lx + 1, 2: lx + 1, lx + 2, :), &

              f_field(:, :, lx, :), lx * lx * nelv)


  subroutine pick_facet_value_hex(f_facet, f_field, lx, nelv) …

  end subroutine pick_facet_value_hex


end module gradient_jump_penalty

device::device_map
Map a Fortran array to a device (allocate and associate)
Definition device.F90:57

device::device_memcpy
Copy data between host and device (or device and device)
Definition device.F90:51

json_utils::json_get_or_default
Retrieves a parameter by name or assigns a provided default value. In the latter case also adds the m...
Definition json_utils.f90:54

utils::neko_error
Definition utils.f90:42

coefs
Coefficients.
Definition coef.f90:34

device_gradient_jump_penalty
Definition device_gradient_jump_penalty.F90:33

device_math
Definition device_math.F90:33

device
Device abstraction, common interface for various accelerators.
Definition device.F90:34

device::host_to_device
integer, parameter, public host_to_device
Definition device.F90:47

dofmap
Defines a mapping of the degrees of freedom.
Definition dofmap.f90:35

element
Definition element.f90:33

field
Defines a field.
Definition field.f90:34

gather_scatter
Gather-scatter.
Definition gather_scatter.f90:34

gradient_jump_penalty
Implements gradient_jump_penalty_t.
Definition gradient_jump_penalty.f90:35

gradient_jump_penalty::gradient_jump_penalty_finalize_hex
subroutine gradient_jump_penalty_finalize_hex(penalty, wa, dphidxi, lx, nelv)
Finalizinge the gradient jump penalty term for hexahedral elements. <tau * h^2 * absvolflux * G * phi...
Definition gradient_jump_penalty.f90:786

gradient_jump_penalty::gradient_jump_penalty_compute
subroutine gradient_jump_penalty_compute(this, u, v, w, s)
Compute the gradient jump penalty term.
Definition gradient_jump_penalty.f90:718

gradient_jump_penalty::gradient_jump_penalty_finalize
subroutine gradient_jump_penalty_finalize(penalty, wa, dphidxi, lx, nelv)
Interface of finalizing the gradient jump penalty term. <tau * h^2 * absvolflux * G * phij * phik * d...
Definition gradient_jump_penalty.f90:769

gradient_jump_penalty::absvolflux_compute
subroutine absvolflux_compute(this, u, v, w)
Compute the average of the volumetric flux over facets.
Definition gradient_jump_penalty.f90:864

gradient_jump_penalty::gradient_jump_penalty_perform
subroutine gradient_jump_penalty_perform(this, f)
Assign the gradient jump penalty term.
Definition gradient_jump_penalty.f90:748

gradient_jump_penalty::facet_factor_init
subroutine facet_factor_init(this)
Initialize the facet factor array.
Definition gradient_jump_penalty.f90:498

gradient_jump_penalty::g_compute
subroutine g_compute(this, s)
Compute the average of the flux over facets.
Definition gradient_jump_penalty.f90:818

gradient_jump_penalty::eval_h2_hex
subroutine eval_h2_hex(h2_el, n, i, dm, coef)
Evaluate h^2 for each element for hexahedral mesh.
Definition gradient_jump_penalty.f90:335

gradient_jump_penalty::dist2_quadrature_hex
real(kind=rp) function dist2_quadrature_hex(l, k, j, i, n, dm, coef)
Definition gradient_jump_penalty.f90:376

gradient_jump_penalty::gradient_jump_penalty_init
subroutine gradient_jump_penalty_init(this, params, dofmap, coef, a, b)
Constructor.
Definition gradient_jump_penalty.f90:146

gradient_jump_penalty::pick_facet_value_hex
subroutine pick_facet_value_hex(f_facet, f_field, lx, nelv)
Pick facet values of a field.
Definition gradient_jump_penalty.f90:906

gradient_jump_penalty::gradient_jump_penalty_free
subroutine gradient_jump_penalty_free(this)
Destructor for the gradient_jump_penalty_t class.
Definition gradient_jump_penalty.f90:585

gs_ops
Defines Gather-scatter operations.
Definition gs_ops.f90:34

gs_ops::gs_op_add
integer, parameter, public gs_op_add
Definition gs_ops.f90:36

hex
Defines a hexahedron element.
Definition hex.f90:34

json_utils
Utilities for retrieving parameters from the case files.
Definition json_utils.f90:34

math
Definition math.f90:60

neko_config
Build configurations.
Definition neko_config.f90:34

neko_config::neko_bcknd_device
integer, parameter neko_bcknd_device
Definition neko_config.f90:44

num_types
Definition num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

operators
Operators.
Definition operators.f90:34

operators::dudxyz
subroutine, public dudxyz(du, u, dr, ds, dt, coef)
Compute derivative of a scalar field along a single direction.
Definition operators.f90:76

point
Implements a point.
Definition point.f90:35

quad
Defines a quadrilateral element.
Definition quad.f90:34

space
Defines a function space.
Definition space.f90:34

space::gll
integer, parameter, public gll
Definition space.f90:48

utils
Utilities.
Definition utils.f90:35

coefs::coef_t
Coefficients defined on a given (mesh, ) tuple. Arrays use indices (i,j,k,e): element e,...
Definition coef.f90:55

dofmap::dofmap_t
Definition dofmap.f90:53

element::element_t
Base type for an element.
Definition element.f90:44

field::field_t
Definition field.f90:46

gather_scatter::gs_t
Definition gather_scatter.f90:58

gradient_jump_penalty::gradient_jump_penalty_t
Implements the gradient jump penalty.
Definition gradient_jump_penalty.f90:62

hex::hex_t
Hexahedron element.
Definition hex.f90:63

point::point_t
A point in  with coordinates .
Definition point.f90:43

quad::quad_t
Quadrilateral element.
Definition quad.f90:58

space::space_t
The function space for the SEM solution fields.
Definition space.f90:62