dtfft_executor_mkl_m.F90 Source File


This file depends on

sourcefile~~dtfft_executor_mkl_m.f90~~EfferentGraph sourcefile~dtfft_executor_mkl_m.f90 dtfft_executor_mkl_m.F90 sourcefile~dtfft_abstract_executor.f90 dtfft_abstract_executor.F90 sourcefile~dtfft_executor_mkl_m.f90->sourcefile~dtfft_abstract_executor.f90 sourcefile~dtfft_interface_mkl_m.f90 dtfft_interface_mkl_m.F90 sourcefile~dtfft_executor_mkl_m.f90->sourcefile~dtfft_interface_mkl_m.f90 sourcefile~dtfft_interface_mkl_native_m.f90 dtfft_interface_mkl_native_m.F90 sourcefile~dtfft_executor_mkl_m.f90->sourcefile~dtfft_interface_mkl_native_m.f90 sourcefile~dtfft_parameters.f90 dtfft_parameters.F90 sourcefile~dtfft_executor_mkl_m.f90->sourcefile~dtfft_parameters.f90 sourcefile~dtfft_utils.f90 dtfft_utils.F90 sourcefile~dtfft_executor_mkl_m.f90->sourcefile~dtfft_utils.f90 sourcefile~dtfft_abstract_executor.f90->sourcefile~dtfft_parameters.f90 sourcefile~dtfft_abstract_executor.f90->sourcefile~dtfft_utils.f90 sourcefile~dtfft_interface_nvtx.f90 dtfft_interface_nvtx.F90 sourcefile~dtfft_abstract_executor.f90->sourcefile~dtfft_interface_nvtx.f90 sourcefile~dtfft_pencil.f90 dtfft_pencil.F90 sourcefile~dtfft_abstract_executor.f90->sourcefile~dtfft_pencil.f90 sourcefile~dtfft_interface_mkl_m.f90->sourcefile~dtfft_utils.f90 sourcefile~dtfft_utils.f90->sourcefile~dtfft_parameters.f90 sourcefile~dtfft_interface_nvtx.f90->sourcefile~dtfft_utils.f90 sourcefile~dtfft_pencil.f90->sourcefile~dtfft_parameters.f90 sourcefile~dtfft_pencil.f90->sourcefile~dtfft_utils.f90 sourcefile~dtfft_interface_cuda_runtime.f90 dtfft_interface_cuda_runtime.F90 sourcefile~dtfft_pencil.f90->sourcefile~dtfft_interface_cuda_runtime.f90 sourcefile~dtfft_interface_cuda_runtime.f90->sourcefile~dtfft_parameters.f90 sourcefile~dtfft_interface_cuda_runtime.f90->sourcefile~dtfft_utils.f90

Files dependent on this one

sourcefile~~dtfft_executor_mkl_m.f90~~AfferentGraph sourcefile~dtfft_executor_mkl_m.f90 dtfft_executor_mkl_m.F90 sourcefile~dtfft_plan.f90 dtfft_plan.F90 sourcefile~dtfft_plan.f90->sourcefile~dtfft_executor_mkl_m.f90 sourcefile~dtfft.f90 dtfft.F90 sourcefile~dtfft.f90->sourcefile~dtfft_plan.f90 sourcefile~dtfft_api.f90 dtfft_api.F90 sourcefile~dtfft_api.f90->sourcefile~dtfft_plan.f90

Source Code

!------------------------------------------------------------------------------------------------
! Copyright (c) 2021, Oleg Shatrov
! All rights reserved.
! This file is part of dtFFT library.

! dtFFT is free software: you can redistribute it and/or modify
! it under the terms of the GNU General Public License as published by
! the Free Software Foundation, either version 3 of the License, or
! (at your option) any later version.

! dtFFT is distributed in the hope that it will be useful,
! but WITHOUT ANY WARRANTY; without even the implied warranty of
! MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
! GNU General Public License for more details.

! You should have received a copy of the GNU General Public License
! along with this program.  If not, see <https://www.gnu.org/licenses/>.
!------------------------------------------------------------------------------------------------
module dtfft_executor_mkl_m
!! This module describes MKL based FFT Executor: [[mkl_executor]]
!!
!! https://software.intel.com/content/www/us/en/develop/documentation/onemkl-developer-reference-fortran/top/fourier-transform-functions/fft-functions.html
use iso_fortran_env,              only: int8, int32, int64, error_unit
use iso_c_binding,                only: c_int, c_long, c_ptr
use dtfft_abstract_executor,      only: abstract_executor, FFT_C2C, FFT_R2C, FFT_R2R
use dtfft_interface_mkl_m
use dtfft_interface_mkl_native_m
use dtfft_parameters
use dtfft_utils,                  only: int_to_str
#include "dtfft_mpi.h"
implicit none
private
public :: mkl_executor

#define MKL_DFTI_CALL(name, func)                                                                                                                                     \
  block;                                                                                                                                                              \
    integer(c_long) :: ierr;                                                                                                                                          \
    integer(int32)  :: mpi_err;                                                                                                                                       \
    ierr = func;                                                                                                                                                      \
    if( ierr /= DFTI_NO_ERROR ) then;                                                                                                                                 \
      write(error_unit, '(a)') "Error occured during call to MKL DFTI function '"//name//"': "//DftiErrorMessage(ierr)//" at "//__FILE__//":"//int_to_str(__LINE__);  \
      call MPI_Abort(MPI_COMM_WORLD, int(ierr, c_int), mpi_err);                                                                                                      \
    endif;                                                                                                                                                            \
  endblock

  type, extends(abstract_executor)  :: mkl_executor
  !! MKL FFT Executor
  private
    logical                       :: need_reconfigure     !! Needed for R2C plans
    integer(c_long), allocatable  :: istrides(:)          !! Input strides. Needed for R2C plans to reconfigure plan
    integer(c_long), allocatable  :: ostrides(:)          !! Output strides. Needed for R2C plans to reconfigure plan
    integer(int32)                :: idist                !! Input distance between the first data elements of consecutive data sets
    integer(int32)                :: odist                !! Output distance between the first data elements of consecutive data sets
  contains
    procedure :: create_private => create     !! Creates FFT plan via MKL DFTI Interface
    procedure :: execute_private => execute   !! Executes MKL plan
    procedure :: destroy_private => destroy   !! Destroys MKL plan
    procedure, nopass :: mem_alloc            !! Allocates MKL memory
    procedure, nopass :: mem_free             !! Frees MKL aligned memory
  endtype mkl_executor

contains

  subroutine make_plan(fft_rank, fft_sizes, mkl_precision, forward_domain, how_many, idist, odist, plan)
  !! Creates general MKL plan
    integer(int8),              intent(in)    :: fft_rank           !! Rank of fft: 1 or 2
    integer(c_long),            intent(in)    :: fft_sizes(:)       !! Dimensions of transform
    integer(int32),             intent(in)    :: mkl_precision      !! MKL Precision
    integer(int32),             intent(in)    :: forward_domain     !! C2C or R2C flag
    integer(int32),             intent(in)    :: how_many           !! Sets DFTI_NUMBER_OF_TRANSFORMS
    integer(int32),             intent(in)    :: idist              !! Sets DFTI_INPUT_DISTANCE
    integer(int32),             intent(in)    :: odist              !! Sets DFTI_OUTPUT_DISTANCE
    type(c_ptr),                intent(inout) :: plan               !! Resulting plan

    MKL_DFTI_CALL( "DftiCreateDescriptor", mkl_dfti_create_desc(mkl_precision, forward_domain, int(fft_rank, c_long), fft_sizes, plan) )
    MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(plan, DFTI_NUMBER_OF_TRANSFORMS, how_many) )
    MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(plan, DFTI_PLACEMENT, DFTI_NOT_INPLACE) )
    MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(plan, DFTI_INPUT_DISTANCE, idist) )
    MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(plan, DFTI_OUTPUT_DISTANCE, odist) )
    MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(plan, DFTI_CONJUGATE_EVEN_STORAGE, DFTI_COMPLEX_COMPLEX) )
    MKL_DFTI_CALL( "DftiCommitDescriptor", mkl_dfti_commit_desc(plan) )
  end subroutine make_plan

  subroutine create(self, fft_rank, fft_type, precision, idist, odist, how_many, fft_sizes, inembed, onembed, error_code, r2r_kinds)
  !! Creates FFT plan via MKL DFTI Interface
    class(mkl_executor),              intent(inout) :: self           !! MKL FFT Executor
    integer(int8),                    intent(in)    :: fft_rank       !! Rank of fft: 1 or 2
    integer(int8),                    intent(in)    :: fft_type       !! Type of fft: r2r, r2c, c2c
    type(dtfft_precision_t),          intent(in)    :: precision      !! Precision of fft: DTFFT_SINGLE or DTFFT_DOUBLE
    integer(int32),                   intent(in)    :: idist          !! Distance between the first element of two consecutive signals in a batch of the input data.
    integer(int32),                   intent(in)    :: odist          !! Distance between the first element of two consecutive signals in a batch of the output data.
    integer(int32),                   intent(in)    :: how_many       !! Number of transforms to create
    integer(int32),                   intent(in)    :: fft_sizes(:)   !! Dimensions of transform
    integer(int32),                   intent(in)    :: inembed(:)     !! Storage dimensions of the input data in memory.
    integer(int32),                   intent(in)    :: onembed(:)     !! Storage dimensions of the output data in memory.
    integer(int32),                   intent(inout) :: error_code     !! Error code to be returned to user
    type(dtfft_r2r_kind_t), optional, intent(in)    :: r2r_kinds(:)   !! Kinds of r2r transform
    integer(int32) :: forward_domain, mkl_precision, i, idx
    integer(c_long) :: iprod, oprod, sizes(fft_rank)

    if ( present(r2r_kinds) ) then
    endif

    error_code = DTFFT_SUCCESS

    self%is_inverse_copied = .true.
    self%need_reconfigure = .false.

    select case (fft_type)
    case (FFT_C2C)
      forward_domain = DFTI_COMPLEX
    case (FFT_R2C)
      forward_domain = DFTI_REAL
      self%need_reconfigure = .true.
      self%idist = idist
      self%odist = odist
      allocate( self%istrides( size(inembed) + 1), source=0_c_long )
      allocate( self%ostrides( size(onembed) + 1), source=0_c_long )
      iprod = 1; oprod = 1
      self%istrides( size(inembed) + 1 ) = iprod
      self%ostrides( size(onembed) + 1 ) = oprod
      do i = 1, size(inembed) - 1
        idx = size(inembed) + 1 - i
        iprod = iprod * inembed( idx )
        oprod = oprod * onembed( idx )
        self%istrides(idx) = iprod
        self%ostrides(idx) = oprod
      enddo
    case (FFT_R2R)
      error_code = DTFFT_ERROR_R2R_FFT_NOT_SUPPORTED
      return
    endselect
    if(precision == DTFFT_DOUBLE) then
      mkl_precision = DFTI_DOUBLE
    else
      mkl_precision = DFTI_SINGLE
    endif

    sizes(:) = fft_sizes(:)
    call make_plan(fft_rank, sizes, mkl_precision, forward_domain, how_many, idist, odist, self%plan_forward)
    self%plan_backward = self%plan_forward
  end subroutine create

  subroutine execute(self, a, b, sign)
  !! Executes MKL plan
    class(mkl_executor),  intent(in)  :: self                 !! MKL FFT Executor
    type(c_ptr),          intent(in)  :: a                    !! Source pointer
    type(c_ptr),          intent(in)  :: b                    !! Target pointer
    integer(int8),        intent(in)  :: sign                 !! Sign of transform

    if ( self%need_reconfigure ) then
      if ( sign == FFT_FORWARD ) then
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_INPUT_DISTANCE, self%idist) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_OUTPUT_DISTANCE, self%odist) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_INPUT_STRIDES, self%istrides) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_OUTPUT_STRIDES, self%ostrides) )
      else
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_INPUT_DISTANCE, self%odist) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_OUTPUT_DISTANCE, self%idist) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_INPUT_STRIDES, self%ostrides) )
        MKL_DFTI_CALL( "DftiSetValue", mkl_dfti_set_value(self%plan_forward, DFTI_OUTPUT_STRIDES, self%istrides) )
      endif
      MKL_DFTI_CALL( "DftiCommitDescriptor", mkl_dfti_commit_desc(self%plan_forward) )
    endif

    MKL_DFTI_CALL( "DftiCompute", mkl_dfti_execute(self%plan_forward, a, b, int(sign, c_int)) )
  end subroutine execute

  subroutine destroy(self)
  !! Destroys MKL plan
    class(mkl_executor),  intent(inout)  :: self              !! MKL FFT Executor

    MKL_DFTI_CALL( "DftiFreeDescriptor", mkl_dfti_free_desc(self%plan_forward) )
  end subroutine destroy

  subroutine mem_alloc(alloc_bytes, ptr)
  !! Allocates MKL memory
    integer(int64),           intent(in)  :: alloc_bytes      !! Number of bytes to allocate
    type(c_ptr),              intent(out) :: ptr              !! Allocated pointer

    MKL_DFTI_CALL( "mkl_malloc", mkl_dfti_mem_alloc(alloc_bytes, ptr) )
  end subroutine mem_alloc

  subroutine mem_free(ptr)
  !! Frees MKL aligned memory
    type(c_ptr),               intent(in)   :: ptr            !! Pointer to free

    MKL_DFTI_CALL( "mkl_free", mkl_dfti_mem_free(ptr) )
  end subroutine mem_free
end module dtfft_executor_mkl_m