dd/dbf/cg__coupled_8f90_source.html

 ! Copyright (c) 2024, The Neko Authors

 ! All rights reserved.

 !

 ! Redistribution and use in source and binary forms, with or without

 ! modification, are permitted provided that the following conditions

 ! are met:

 !

 !   * Redistributions of source code must retain the above copyright

 !     notice, this list of conditions and the following disclaimer.

 !

 !   * Redistributions in binary form must reproduce the above

 !     copyright notice, this list of conditions and the following

 !     disclaimer in the documentation and/or other materials provided

 !     with the distribution.

 !

 !   * Neither the name of the authors nor the names of its

 !     contributors may be used to endorse or promote products derived

 !     from this software without specific prior written permission.

 !

 ! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

 ! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

 ! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

 ! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

 ! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

 ! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

 ! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 ! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

 ! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

 ! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

 ! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 ! POSSIBILITY OF SUCH DAMAGE.

 !

 module cg_cpld

   use num_types, only: rp

   use krylov, only : ksp_t, ksp_monitor_t, ksp_max_iter

   use precon,  only : pc_t

   use ax_product, only : ax_t

   use field, only : field_t

   use coefs, only : coef_t

   use gather_scatter, only : gs_t, gs_op_add

   use bc, only : bc_list_t, bc_list_apply

   use math, only : glsc3, glsc2

   use utils, only : neko_error

   implicit none

   private


   type, public, extends(ksp_t) :: cg_cpld_t

      real(kind=rp), allocatable :: w1(:)

      real(kind=rp), allocatable :: w2(:)

      real(kind=rp), allocatable :: w3(:)

      real(kind=rp), allocatable :: r1(:)

      real(kind=rp), allocatable :: r2(:)

      real(kind=rp), allocatable :: r3(:)

      real(kind=rp), allocatable :: p1(:)

      real(kind=rp), allocatable :: p2(:)

      real(kind=rp), allocatable :: p3(:)

      real(kind=rp), allocatable :: z1(:)

      real(kind=rp), allocatable :: z2(:)

      real(kind=rp), allocatable :: z3(:)

      real(kind=rp), allocatable :: tmp(:)

    contains

      procedure, pass(this) :: init => cg_cpld_init

      procedure, pass(this) :: free => cg_cpld_free

      procedure, pass(this) :: solve => cg_cpld_nop

      procedure, pass(this) :: solve_coupled => cg_cpld_solve

   end type cg_cpld_t


 contains


   subroutine cg_cpld_init(this, n, max_iter, M, rel_tol, abs_tol, monitor)

     class(cg_cpld_t), intent(inout) :: this

     integer, intent(in) :: max_iter

     class(pc_t), optional, intent(in), target :: M

     integer, intent(in) :: n

     real(kind=rp), optional, intent(in) :: rel_tol

     real(kind=rp), optional, intent(in) :: abs_tol

     logical, optional, intent(in) :: monitor


     call this%free()


     allocate(this%w1(n))

     allocate(this%w2(n))

     allocate(this%w3(n))

     allocate(this%r1(n))

     allocate(this%r2(n))

     allocate(this%r3(n))

     allocate(this%p1(n))

     allocate(this%p2(n))

     allocate(this%p3(n))

     allocate(this%z1(n))

     allocate(this%z2(n))

     allocate(this%z3(n))

     allocate(this%tmp(n))


     if (present(m)) then

        this%M => m

     end if


     if (present(rel_tol) .and. present(abs_tol) .and. present(monitor)) then

        call this%ksp_init(max_iter, rel_tol, abs_tol, monitor = monitor)

     else if (present(rel_tol) .and. present(abs_tol)) then

        call this%ksp_init(max_iter, rel_tol, abs_tol)

     else if (present(monitor) .and. present(abs_tol)) then

        call this%ksp_init(max_iter, abs_tol = abs_tol, monitor = monitor)

     else if (present(rel_tol) .and. present(monitor)) then

        call this%ksp_init(max_iter, rel_tol, monitor = monitor)

     else if (present(rel_tol)) then

        call this%ksp_init(max_iter, rel_tol = rel_tol)

     else if (present(abs_tol)) then

        call this%ksp_init(max_iter, abs_tol = abs_tol)

     else if (present(monitor)) then

        call this%ksp_init(max_iter, monitor = monitor)

     else

        call this%ksp_init(max_iter)

     end if


   end subroutine cg_cpld_init


   subroutine cg_cpld_free(this)

     class(cg_cpld_t), intent(inout) :: this


     call this%ksp_free()


     if (allocated(this%w1)) then

        deallocate(this%w1)

     end if


     if (allocated(this%w2)) then

        deallocate(this%w2)

     end if


     if (allocated(this%w3)) then

        deallocate(this%w3)

     end if


     if (allocated(this%r1)) then

        deallocate(this%r1)

     end if


     if (allocated(this%r2)) then

        deallocate(this%r2)

     end if


     if (allocated(this%r3)) then

        deallocate(this%r3)

     end if


     if (allocated(this%p1)) then

        deallocate(this%p1)

     end if


     if (allocated(this%p2)) then

        deallocate(this%p2)

     end if


     if (allocated(this%p3)) then

        deallocate(this%p3)

     end if


     if (allocated(this%z1)) then

        deallocate(this%z1)

     end if


     if (allocated(this%z2)) then

        deallocate(this%z2)

     end if


     if (allocated(this%z3)) then

        deallocate(this%z3)

     end if


     if (allocated(this%tmp)) then

        deallocate(this%tmp)

     end if


     nullify(this%M)


   end subroutine cg_cpld_free


   function cg_cpld_nop(this, Ax, x, f, n, coef, blst, gs_h, niter) &

        result(ksp_results)

     class(cg_cpld_t), intent(inout) :: this

     class(ax_t), intent(in) :: ax

     type(field_t), intent(inout) :: x

     integer, intent(in) :: n

     real(kind=rp), dimension(n), intent(in) :: f

     type(coef_t), intent(inout) :: coef

     type(bc_list_t), intent(in) :: blst

     type(gs_t), intent(inout) :: gs_h

     type(ksp_monitor_t) :: ksp_results

     integer, optional, intent(in) :: niter


     ! Throw and error

     call neko_error('The cpldcg solver is only defined for coupled solves')


     ksp_results%res_final = 0.0

     ksp_results%iter = 0

   end function cg_cpld_nop


   function cg_cpld_solve(this, Ax, x, y, z, fx, fy, fz, &

        n, coef, blstx, blsty, blstz, gs_h, niter) result(ksp_results)

     class(cg_cpld_t), intent(inout) :: this

     class(ax_t), intent(in) :: ax

     type(field_t), intent(inout) :: x

     type(field_t), intent(inout) :: y

     type(field_t), intent(inout) :: z

     integer, intent(in) :: n

     real(kind=rp), dimension(n), intent(in) :: fx

     real(kind=rp), dimension(n), intent(in) :: fy

     real(kind=rp), dimension(n), intent(in) :: fz

     type(coef_t), intent(inout) :: coef

     type(bc_list_t), intent(in) :: blstx

     type(bc_list_t), intent(in) :: blsty

     type(bc_list_t), intent(in) :: blstz

     type(gs_t), intent(inout) :: gs_h

     type(ksp_monitor_t), dimension(3) :: ksp_results

     integer, optional, intent(in) :: niter

     real(kind=rp), parameter :: one = 1.0

     real(kind=rp), parameter :: zero = 0.0

     integer :: i, iter, max_iter

     real(kind=rp) :: rnorm, rtr, rtr0, rtz2, rtz1

     real(kind=rp) :: beta, pap, alpha, alphm, norm_fac


     if (present(niter)) then

        max_iter = niter

     else

        max_iter = this%max_iter

     end if

     norm_fac = one / coef%volume


     associate(p1 => this%p1, p2 => this%p2, p3 => this%p3, z1 => this%z1, &

          z2 => this%z2, z3 => this%z3, r1 => this%r1, r2 => this%r2, &

          r3 => this%r3, tmp => this%tmp, w1 => this%w1, w2 => this%w2, &

          w3 => this%w3)


       rtz1 = one

       do concurrent(i = 1:n)

          x%x(i,1,1,1) = 0.0_rp

          y%x(i,1,1,1) = 0.0_rp

          z%x(i,1,1,1) = 0.0_rp

          p1(i) = 0.0_rp

          p2(i) = 0.0_rp

          p3(i) = 0.0_rp

          z1(i) = 0.0_rp

          z2(i) = 0.0_rp

          z3(i) = 0.0_rp

          r1(i) = fx(i)

          r2(i) = fy(i)

          r3(i) = fz(i)

          tmp(i) = r1(i)**2 + r2(i)**2 + r3(i)**2

       end do


       rtr = glsc3(tmp, coef%mult, coef%binv, n)

       rnorm = sqrt(rtr*norm_fac)

       ksp_results%res_start = rnorm

       ksp_results%res_final = rnorm

       ksp_results%iter = 0

       if (rnorm .eq. zero) return


       call this%monitor_start('cpldCG')

       do iter = 1, max_iter

          call this%M%solve(z1, this%r1, n)

          call this%M%solve(z2, this%r2, n)

          call this%M%solve(z3, this%r3, n)

          rtz2 = rtz1


          do concurrent(i = 1:n)

             this%tmp(i) = z1(i) * r1(i) &

                         + z2(i) * r2(i) &

                         + z3(i) * r3(i)

          end do


          rtz1 = glsc2(tmp, coef%mult, n)


          beta = rtz1 / rtz2

          if (iter .eq. 1) beta = zero

          do concurrent(i = 1:n)

             p1(i) = p1(i) * beta + z1(i)

             p2(i) = p2(i) * beta + z2(i)

             p3(i) = p3(i) * beta + z3(i)

          end do


          call ax%compute_vector(w1, w2, w3, p1, p2, p3, coef, x%msh, x%Xh)

          call gs_h%op(w1, n, gs_op_add)

          call gs_h%op(w2, n, gs_op_add)

          call gs_h%op(w3, n, gs_op_add)

          call bc_list_apply(blstx, w1, n)

          call bc_list_apply(blsty, w2, n)

          call bc_list_apply(blstz, w3, n)


          do concurrent(i = 1:n)

             tmp(i) = w1(i) * p1(i) &

                    + w2(i) * p2(i) &

                    + w3(i) * p3(i)

          end do


          pap = glsc2(tmp, coef%mult, n)


          alpha = rtz1 / pap

          alphm = -alpha

          do concurrent(i = 1:n)

             x%x(i,1,1,1) = x%x(i,1,1,1) + alpha * p1(i)

             y%x(i,1,1,1) = y%x(i,1,1,1) + alpha * p2(i)

             z%x(i,1,1,1) = z%x(i,1,1,1) + alpha * p3(i)

             r1(i) = r1(i) + alphm * w1(i)

             r2(i) = r2(i) + alphm * w2(i)

             r3(i) = r3(i) + alphm * w3(i)

             tmp(i) = r1(i)**2 + r2(i)**2 + r3(i)**2

          end do


          rtr = glsc3(tmp, coef%mult, coef%binv, n)

          if (iter .eq. 1) rtr0 = rtr

          rnorm = sqrt(rtr * norm_fac)

          call this%monitor_iter(iter, rnorm)

          if (rnorm .lt. this%abs_tol) then

             exit

          end if

       end do

     end associate

     call this%monitor_stop()

     ksp_results%res_final = rnorm

     ksp_results%iter = iter

   end function cg_cpld_solve


 end module cg_cpld

bc::bc_list_apply
Definition: bc.f90:190

utils::neko_error
Definition: utils.f90:42

ax_product
Defines a Matrix-vector product.
Definition: ax.f90:34

bc
Defines a boundary condition.
Definition: bc.f90:34

cg_cpld
Defines a coupled Conjugate Gradient methods.
Definition: cg_coupled.f90:34

cg_cpld::cg_cpld_solve
type(ksp_monitor_t) function, dimension(3) cg_cpld_solve(this, Ax, x, y, z, fx, fy, fz, n, coef, blstx, blsty, blstz, gs_h, niter)
Coupled PCG solve.
Definition: cg_coupled.f90:207

cg_cpld::cg_cpld_init
subroutine cg_cpld_init(this, n, max_iter, M, rel_tol, abs_tol, monitor)
Initialise a coupled PCG solver.
Definition: cg_coupled.f90:74

cg_cpld::cg_cpld_nop
type(ksp_monitor_t) function cg_cpld_nop(this, Ax, x, f, n, coef, blst, gs_h, niter)
Definition: cg_coupled.f90:186

cg_cpld::cg_cpld_free
subroutine cg_cpld_free(this)
Deallocate a coupled PCG solver.
Definition: cg_coupled.f90:124

coefs
Coefficients.
Definition: coef.f90:34

field
Defines a field.
Definition: field.f90:34

gather_scatter
Gather-scatter.
Definition: gather_scatter.f90:34

krylov
Implements the base abstract type for Krylov solvers plus helper types.
Definition: krylov.f90:34

krylov::ksp_max_iter
integer, parameter, public ksp_max_iter
Maximum number of iters.
Definition: krylov.f90:51

math
Definition: math.f90:60

math::glsc3
real(kind=rp) function, public glsc3(a, b, c, n)
Weighted inner product .
Definition: math.f90:895

math::glsc2
real(kind=rp) function, public glsc2(a, b, n)
Weighted inner product .
Definition: math.f90:876

num_types
Definition: num_types.f90:1

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition: num_types.f90:12

precon
Krylov preconditioner.
Definition: precon.f90:34

utils
Utilities.
Definition: utils.f90:35

ax_product::ax_t
Base type for a matrix-vector product providing .
Definition: ax.f90:43

bc::bc_list_t
A list of boundary conditions.
Definition: bc.f90:104

cg_cpld::cg_cpld_t
Coupled preconditioned conjugate gradient method.
Definition: cg_coupled.f90:49

coefs::coef_t
Coefficients defined on a given (mesh, ) tuple. Arrays use indices (i,j,k,e): element e,...
Definition: coef.f90:55

field::field_t
Definition: field.f90:46

gather_scatter::gs_t
Definition: gather_scatter.f90:58

krylov::ksp_monitor_t
Type for storing initial and final residuals in a Krylov solver.
Definition: krylov.f90:56

krylov::ksp_t
Base abstract type for a canonical Krylov method, solving .
Definition: krylov.f90:66

precon::pc_t
Defines a canonical Krylov preconditioner.
Definition: precon.f90:40