d0/d28/device__mathops_8F90_source.html

! Copyright (c) 2021-2023, The Neko Authors

! All rights reserved.

!

! Redistribution and use in source and binary forms, with or without

! modification, are permitted provided that the following conditions

! are met:

!

!   * Redistributions of source code must retain the above copyright

!     notice, this list of conditions and the following disclaimer.

!

!   * Redistributions in binary form must reproduce the above

!     copyright notice, this list of conditions and the following

!     disclaimer in the documentation and/or other materials provided

!     with the distribution.

!

!   * Neither the name of the authors nor the names of its

!     contributors may be used to endorse or promote products derived

!     from this software without specific prior written permission.

!

! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

! "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

! LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS

! FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE

! COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,

! INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

! BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

! LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

! CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT

! LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

! ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

! POSSIBILITY OF SUCH DAMAGE.

!

module device_mathops

  use num_types, only : rp, c_rp

  use utils, only : neko_error

  use, intrinsic :: iso_c_binding, only : c_int, c_ptr

  implicit none

  private


#ifdef HAVE_HIP

  !> Explicit interface for the C-bound HIP backend routine `hip_opchsign`.
  !! The three pointer arguments carry the `value` attribute and are passed
  !! by value; `gdim` and `n` have no `value` attribute and are therefore
  !! passed by reference.
  !! NOTE(review): judging by the name this presumably flips the sign of the
  !! vector (a1, a2, a3) -- confirm against the HIP implementation.
  interface
     subroutine hip_opchsign(a1_d, a2_d, a3_d, gdim, n) &
          bind(c, name='hip_opchsign')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       integer(c_int) :: gdim, n
     end subroutine hip_opchsign
  end interface


  !> Explicit interface for the C-bound HIP backend routine `hip_opcolv`.
  !! All four pointer arguments are passed by value; `gdim` and `n` are
  !! passed by reference (no `value` attribute).
  !! NOTE(review): the name suggests a component-wise multiplication of the
  !! vector (a1, a2, a3) by `c_d` -- confirm against the HIP implementation.
  interface
     subroutine hip_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n) &
          bind(c, name='hip_opcolv')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine hip_opcolv
  end interface


  !> Explicit interface for the C-bound HIP backend routine `hip_opcolv3c`.
  !! The seven pointer arguments are passed by value; the scalar `d` (kind
  !! `c_rp`, imported from the host module) and the integers `gdim` and `n`
  !! are passed by reference.
  !! NOTE(review): the exact arithmetic performed on (a, b, c, d) is defined
  !! by the HIP implementation, which is not visible here -- confirm there.
  interface
     subroutine hip_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, d, gdim, n) bind(c, name='hip_opcolv3c')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       real(c_rp) :: d
       integer(c_int) :: gdim, n
     end subroutine hip_opcolv3c
  end interface


  !> Explicit interface for the C-bound HIP backend routine `hip_opadd2cm`.
  !! The six pointer arguments are passed by value; the scalar `c` (kind
  !! `c_rp`, imported from the host module) and the integers `gdim` and `n`
  !! are passed by reference.
  !! NOTE(review): the exact arithmetic performed on (a, b, c) is defined by
  !! the HIP implementation, which is not visible here -- confirm there.
  interface
     subroutine hip_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c, gdim, n) bind(c, name='hip_opadd2cm')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       real(c_rp) :: c
       integer(c_int) :: gdim, n
     end subroutine hip_opadd2cm
  end interface


  !> Explicit interface for the C-bound HIP backend routine `hip_opadd2col`.
  !! The seven pointer arguments are passed by value; `gdim` and `n` are
  !! passed by reference (no `value` attribute).
  !! NOTE(review): the exact arithmetic performed on (a, b, c) is defined by
  !! the HIP implementation, which is not visible here -- confirm there.
  interface
     subroutine hip_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, gdim, n) bind(c, name='hip_opadd2col')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine hip_opadd2col
  end interface

#elif HAVE_CUDA

  !> Explicit interface for the C-bound CUDA backend routine
  !! `cuda_opchsign(void *a1, void *a2, void *a3, int *gdim, int *n)`.
  !! Pointers go by value, the two integers by reference.
  interface
     subroutine cuda_opchsign(a1_d, a2_d, a3_d, gdim, n) &
          bind(c, name='cuda_opchsign')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       integer(c_int) :: gdim, n
     end subroutine cuda_opchsign
  end interface


  !> Explicit interface for the C-bound CUDA backend routine
  !! `cuda_opcolv(void *a1, void *a2, void *a3, void *c, int *gdim, int *n)`.
  !! Pointers go by value, the two integers by reference.
  interface
     subroutine cuda_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n) &
          bind(c, name='cuda_opcolv')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine cuda_opcolv
  end interface


  !> Explicit interface for the C-bound CUDA backend routine
  !! `cuda_opcolv3c(void *a1, ..., void *b3, void *c, real *d, int *gdim,
  !! int *n)`. Pointers go by value; `d`, `gdim` and `n` by reference.
  !! The real kind `c_rp` is imported from the host module.
  interface
     subroutine cuda_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, d, gdim, n) bind(c, name='cuda_opcolv3c')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       real(c_rp) :: d
       integer(c_int) :: gdim, n
     end subroutine cuda_opcolv3c
  end interface


  !> Explicit interface for the C-bound CUDA backend routine
  !! `cuda_opadd2cm(void *a1, ..., void *b3, real *c, int *gdim, int *n)`.
  !! Pointers go by value; `c`, `gdim` and `n` by reference.
  !! The real kind `c_rp` is imported from the host module.
  interface
     subroutine cuda_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c, gdim, n) bind(c, name='cuda_opadd2cm')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       real(c_rp) :: c
       integer(c_int) :: gdim, n
     end subroutine cuda_opadd2cm
  end interface


  !> Explicit interface for the C-bound CUDA backend routine
  !! `cuda_opadd2col(void *a1, ..., void *b3, void *c, int *gdim, int *n)`.
  !! Pointers go by value, the two integers by reference.
  interface
     subroutine cuda_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, gdim, n) bind(c, name='cuda_opadd2col')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine cuda_opadd2col
  end interface

#elif HAVE_OPENCL

  !> Explicit interface for the C-bound OpenCL backend routine
  !! `opencl_opchsign(void *a1, void *a2, void *a3, int *gdim, int *n)`.
  !! Pointers go by value, the two integers by reference.
  interface
     subroutine opencl_opchsign(a1_d, a2_d, a3_d, gdim, n) &
          bind(c, name='opencl_opchsign')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       integer(c_int) :: gdim, n
     end subroutine opencl_opchsign
  end interface


  !> Explicit interface for the C-bound OpenCL backend routine
  !! `opencl_opcolv(void *a1, void *a2, void *a3, void *c, int *gdim,
  !! int *n)`. Pointers go by value, the two integers by reference.
  interface
     subroutine opencl_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n) &
          bind(c, name='opencl_opcolv')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine opencl_opcolv
  end interface


  !> Explicit interface for the C-bound OpenCL backend routine
  !! `opencl_opcolv3c(void *a1, ..., void *b3, void *c, real *d, int *gdim,
  !! int *n)`. Pointers go by value; `d`, `gdim` and `n` by reference.
  !! The real kind `c_rp` is imported from the host module.
  interface
     subroutine opencl_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, d, gdim, n) bind(c, name='opencl_opcolv3c')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       real(c_rp) :: d
       integer(c_int) :: gdim, n
     end subroutine opencl_opcolv3c
  end interface


  !> Explicit interface for the C-bound OpenCL backend routine
  !! `opencl_opadd2cm(void *a1, ..., void *b3, real *c, int *gdim, int *n)`.
  !! Pointers go by value; `c`, `gdim` and `n` by reference.
  !! The real kind `c_rp` is imported from the host module.
  interface
     subroutine opencl_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c, gdim, n) bind(c, name='opencl_opadd2cm')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       import :: c_rp
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       real(c_rp) :: c
       integer(c_int) :: gdim, n
     end subroutine opencl_opadd2cm
  end interface


  !> Explicit interface for the C-bound OpenCL backend routine
  !! `opencl_opadd2col(void *a1, ..., void *b3, void *c, int *gdim, int *n)`.
  !! Pointers go by value, the two integers by reference.
  interface
     subroutine opencl_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, &
          c_d, gdim, n) bind(c, name='opencl_opadd2col')
       use, intrinsic :: iso_c_binding, only : c_ptr, c_int
       type(c_ptr), value :: a1_d, a2_d, a3_d
       type(c_ptr), value :: b1_d, b2_d, b3_d
       type(c_ptr), value :: c_d
       integer(c_int) :: gdim, n
     end subroutine opencl_opadd2col
  end interface

#endif


  public :: device_opchsign, device_opcolv, device_opcolv3c, &

       device_opadd2cm, device_opadd2col


contains


  !> Forward an `opchsign` request to the device backend chosen at compile
  !! time: `hip_opchsign`, `cuda_opchsign` or `opencl_opchsign`, depending on
  !! which of HAVE_HIP / HAVE_CUDA / HAVE_OPENCL is defined. When none is
  !! defined, `neko_error` is called with 'No device backend configured'.
  !! @param a1_d,a2_d,a3_d C pointers handed to the backend by value
  !!        (presumably device memory for the three components -- confirm).
  !! @param gdim Forwarded unchanged as the backend's `gdim` argument.
  !! @param n Forwarded unchanged as the backend's `n` argument.
  subroutine device_opchsign(a1_d, a2_d, a3_d, gdim, n)
    type(c_ptr), intent(in) :: a1_d, a2_d, a3_d
    ! NOTE(review): gdim and n reach the backend by reference; intent(in)
    ! assumes the backend only reads them -- confirm against its sources.
    integer, intent(in) :: n, gdim
#ifdef HAVE_HIP
    call hip_opchsign(a1_d, a2_d, a3_d, gdim, n)
#elif HAVE_CUDA
    call cuda_opchsign(a1_d, a2_d, a3_d, gdim, n)
#elif HAVE_OPENCL
    call opencl_opchsign(a1_d, a2_d, a3_d, gdim, n)
#else
    call neko_error('No device backend configured')
#endif
  end subroutine device_opchsign


  !> Forward an `opcolv` request to the device backend chosen at compile
  !! time: `hip_opcolv`, `cuda_opcolv` or `opencl_opcolv`, depending on which
  !! of HAVE_HIP / HAVE_CUDA / HAVE_OPENCL is defined. When none is defined,
  !! `neko_error` is called with 'No device backend configured'.
  !! @param a1_d,a2_d,a3_d C pointers handed to the backend by value
  !!        (presumably device memory for the three components -- confirm).
  !! @param c_d C pointer handed to the backend by value.
  !! @param gdim Forwarded unchanged as the backend's `gdim` argument.
  !! @param n Forwarded unchanged as the backend's `n` argument.
  subroutine device_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n)
    type(c_ptr), intent(in) :: a1_d, a2_d, a3_d, c_d
    ! NOTE(review): gdim and n reach the backend by reference; intent(in)
    ! assumes the backend only reads them -- confirm against its sources.
    integer, intent(in) :: n, gdim
#ifdef HAVE_HIP
    call hip_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n)
#elif HAVE_CUDA
    call cuda_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n)
#elif HAVE_OPENCL
    call opencl_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n)
#else
    call neko_error('No device backend configured')
#endif
  end subroutine device_opcolv


  !> Forward an `opcolv3c` request to the device backend chosen at compile
  !! time: `hip_opcolv3c`, `cuda_opcolv3c` or `opencl_opcolv3c`, depending on
  !! which of HAVE_HIP / HAVE_CUDA / HAVE_OPENCL is defined. When none is
  !! defined, `neko_error` is called with 'No device backend configured'.
  !! @param a1_d,a2_d,a3_d C pointers handed to the backend by value.
  !! @param b1_d,b2_d,b3_d C pointers handed to the backend by value.
  !! @param c_d C pointer handed to the backend by value.
  !! @param d Real scalar forwarded as the backend's `d` argument.
  !! @param n Forwarded as the backend's `n` argument.
  !! @param gdim Forwarded as the backend's `gdim` argument.
  !! @note The dummy order here is (..., n, gdim) whereas the backend
  !!       routines take (..., gdim, n); the calls below swap them back.
  subroutine device_opcolv3c(a1_d, a2_d, a3_d, &
                             b1_d, b2_d, b3_d, c_d, d, n, gdim)
    type(c_ptr), intent(in) :: a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d
    ! NOTE(review): d, n and gdim reach the backend by reference; intent(in)
    ! assumes the backend only reads them -- confirm against its sources.
    real(kind=rp), intent(in) :: d
    integer, intent(in) :: n, gdim
#ifdef HAVE_HIP
    call hip_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, d, gdim, n)
#elif HAVE_CUDA
    call cuda_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, d, gdim, n)
#elif HAVE_OPENCL
    call opencl_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, d, gdim, n)
#else
    call neko_error('No device backend configured')
#endif
  end subroutine device_opcolv3c


  !> Forward an `opadd2cm` request to the device backend chosen at compile
  !! time: `hip_opadd2cm`, `cuda_opadd2cm` or `opencl_opadd2cm`, depending on
  !! which of HAVE_HIP / HAVE_CUDA / HAVE_OPENCL is defined. When none is
  !! defined, `neko_error` is called with 'No device backend configured'.
  !! @param a1_d,a2_d,a3_d C pointers handed to the backend by value.
  !! @param b1_d,b2_d,b3_d C pointers handed to the backend by value.
  !! @param c Real scalar forwarded as the backend's `c` argument.
  !! @param n Forwarded as the backend's `n` argument.
  !! @param gdim Forwarded as the backend's `gdim` argument.
  !! @note The dummy order here is (..., n, gdim) whereas the backend
  !!       routines take (..., gdim, n); the calls below swap them back.
  subroutine device_opadd2cm (a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c, n, gdim)
    type(c_ptr), intent(in) :: a1_d, a2_d, a3_d, b1_d, b2_d, b3_d
    ! NOTE(review): c, n and gdim reach the backend by reference; intent(in)
    ! assumes the backend only reads them -- confirm against its sources.
    real(kind=rp), intent(in) :: c
    integer, intent(in) :: n, gdim
#ifdef HAVE_HIP
    call hip_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c, gdim, n)
#elif HAVE_CUDA
    call cuda_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c, gdim, n)
#elif HAVE_OPENCL
    call opencl_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c, gdim, n)
#else
    call neko_error('No device backend configured')
#endif
  end subroutine device_opadd2cm


  !> Forward an `opadd2col` request to the device backend chosen at compile
  !! time: `hip_opadd2col`, `cuda_opadd2col` or `opencl_opadd2col`, depending
  !! on which of HAVE_HIP / HAVE_CUDA / HAVE_OPENCL is defined. When none is
  !! defined, `neko_error` is called with 'No device backend configured'.
  !! @param a1_d,a2_d,a3_d C pointers handed to the backend by value.
  !! @param b1_d,b2_d,b3_d C pointers handed to the backend by value.
  !! @param c_d C pointer handed to the backend by value.
  !! @param n Forwarded as the backend's `n` argument.
  !! @param gdim Forwarded as the backend's `gdim` argument.
  !! @note The dummy order here is (..., n, gdim) whereas the backend
  !!       routines take (..., gdim, n); the calls below swap them back.
  subroutine device_opadd2col (a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, n, gdim)
    type(c_ptr), intent(in) :: a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d
    ! NOTE(review): n and gdim reach the backend by reference; intent(in)
    ! assumes the backend only reads them -- confirm against its sources.
    integer, intent(in) :: n, gdim
#ifdef HAVE_HIP
    call hip_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, gdim, n)
#elif HAVE_CUDA
    call cuda_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, gdim, n)
#elif HAVE_OPENCL
    call opencl_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, gdim, n)
#else
    call neko_error('No device backend configured')
#endif
  end subroutine device_opadd2col


end module device_mathops

device_mathops::hip_opadd2cm
Definition device_mathops.F90:71

device_mathops::hip_opadd2col
Definition device_mathops.F90:82

device_mathops::hip_opchsign
Definition device_mathops.F90:42

device_mathops::hip_opcolv3c
Definition device_mathops.F90:60

device_mathops::hip_opcolv
Definition device_mathops.F90:51

utils::neko_error
Definition utils.f90:42

opencl_opcolv3c
void opencl_opcolv3c(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, void *c, real *d, int *gdim, int *n)
Definition mathops.c:101

opencl_opadd2cm
void opencl_opadd2cm(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, real *c, int *gdim, int *n)
Definition mathops.c:133

opencl_opcolv
void opencl_opcolv(void *a1, void *a2, void *a3, void *c, int *gdim, int *n)
Definition mathops.c:75

opencl_opchsign
void opencl_opchsign(void *a1, void *a2, void *a3, int *gdim, int *n)
Definition mathops.c:50

opencl_opadd2col
void opencl_opadd2col(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, void *c, int *gdim, int *n)
Definition mathops.c:164

cuda_opchsign
void cuda_opchsign(void *a1, void *a2, void *a3, int *gdim, int *n)
Definition mathops.cu:42

cuda_opcolv3c
void cuda_opcolv3c(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, void *c, real *d, int *gdim, int *n)
Definition mathops.cu:69

cuda_opadd2cm
void cuda_opadd2cm(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, real *c, int *gdim, int *n)
Definition mathops.cu:85

cuda_opcolv
void cuda_opcolv(void *a1, void *a2, void *a3, void *c, int *gdim, int *n)
Definition mathops.cu:55

cuda_opadd2col
void cuda_opadd2col(void *a1, void *a2, void *a3, void *b1, void *b2, void *b3, void *c, int *gdim, int *n)
Definition mathops.cu:101

device_mathops
Definition device_mathops.F90:33

device_mathops::device_opchsign
subroutine, public device_opchsign(a1_d, a2_d, a3_d, gdim, n)
Definition device_mathops.F90:196

device_mathops::device_opadd2col
subroutine, public device_opadd2col(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, n, gdim)
Definition device_mathops.F90:259

device_mathops::device_opadd2cm
subroutine, public device_opadd2cm(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c, n, gdim)
Definition device_mathops.F90:243

device_mathops::device_opcolv3c
subroutine, public device_opcolv3c(a1_d, a2_d, a3_d, b1_d, b2_d, b3_d, c_d, d, n, gdim)
Definition device_mathops.F90:227

device_mathops::device_opcolv
subroutine, public device_opcolv(a1_d, a2_d, a3_d, c_d, gdim, n)
Definition device_mathops.F90:211

num_types
Definition num_types.f90:1

num_types::c_rp
integer, parameter, public c_rp
Definition num_types.f90:13

num_types::rp
integer, parameter, public rp
Global precision used in computations.
Definition num_types.f90:12

utils
Utilities.
Definition utils.f90:35