cuFFTMp GPU Backend backend_cufftmp
cuFFTMp GPU Backend
Type | Visibility | Attributes | Name | Initial | |||
---|---|---|---|---|---|---|---|
type(dtfft_backend_t), | public | :: | backend |
Backend type |
|||
logical, | public | :: | is_selfcopy |
If backend is self-copying |
|||
logical, | public | :: | is_pipelined |
If backend is pipelined |
|||
integer(kind=int64), | public | :: | aux_size |
Number of bytes required by aux buffer |
|||
integer(kind=int64), | public | :: | send_recv_buffer_size |
Number of float elements in the send and recv buffers |
|||
type(MPI_Comm), | public | :: | comm |
MPI Communicator |
|||
integer(kind=int32), | public, | allocatable | :: | comm_mapping(:) |
Mapping of 1d comm ranks to global comm |
||
integer(kind=int32), | public | :: | comm_size |
Size of MPI Comm |
|||
integer(kind=int32), | public | :: | comm_rank |
Rank in MPI Comm |
|||
integer(kind=int64), | public, | allocatable | :: | send_displs(:) |
Send data displacements, in float elements |
||
integer(kind=int64), | public, | allocatable | :: | send_floats(:) |
Number of elements to send, in float elements |
||
integer(kind=int64), | public, | allocatable | :: | recv_displs(:) |
Recv data displacements, in float elements |
||
integer(kind=int64), | public, | allocatable | :: | recv_floats(:) |
Number of elements to receive, in float elements |
||
type(cudaEvent), | public | :: | execution_event |
Event for main execution stream |
|||
type(cudaEvent), | public | :: | copy_event |
Event for copy stream |
|||
type(dtfft_stream_t), | public | :: | copy_stream |
Stream for copy operations |
|||
integer(kind=int64), | public | :: | self_copy_bytes |
Number of bytes to copy to itself |
|||
integer(kind=int64), | public | :: | self_send_displ |
Displacement for send buffer |
|||
integer(kind=int64), | public | :: | self_recv_displ |
Displacement for recv buffer |
|||
type(nvrtc_kernel), | public, | pointer | :: | unpack_kernel |
Kernel for unpacking data |
||
type(nvrtc_kernel), | public, | pointer | :: | unpack_kernel2 |
Kernel for unpacking data |
||
type(cufftReshapeHandle), | private | :: | plan |
procedure, public, non_overridable, pass(self) :: create | ../../ Creates Abstract GPU Backend |
procedure, public, non_overridable, pass(self) :: execute | ../../ Executes GPU Backend |
procedure, public, non_overridable, pass(self) :: destroy | ../../ Destroys Abstract GPU Backend |
procedure, public, non_overridable, pass(self) :: get_aux_size | ../../ Returns number of bytes required by aux buffer |
procedure, public, non_overridable, pass(self) :: set_unpack_kernel | ../../ Sets unpack kernel for pipelined backend |
procedure, public :: create_private => create | |
procedure, public :: execute_private => execute | |
procedure, public :: destroy_private => destroy |
Type | Visibility | Attributes | Name | Initial | |||
---|---|---|---|---|---|---|---|
integer(kind=c_long_long), | public | :: | lower(3) | ||||
integer(kind=c_long_long), | public | :: | upper(3) | ||||
integer(kind=c_long_long), | public | :: | strides(3) |
Creates cuFFTMp GPU Backend
Type | Intent | Optional | Attributes | Name | ||
---|---|---|---|---|---|---|
class(backend_cufftmp), | intent(inout) | :: | self |
cuFFTMp GPU Backend |
||
type(backend_helper), | intent(in) | :: | helper |
Backend helper |
||
type(dtfft_transpose_t), | intent(in) | :: | tranpose_type |
Type of transpose to create |
||
integer(kind=int64), | intent(in) | :: | base_storage |
Number of bytes to store single element |
Executes cuFFTMp GPU Backend
Type | Intent | Optional | Attributes | Name | ||
---|---|---|---|---|---|---|
class(backend_cufftmp), | intent(inout) | :: | self |
cuFFTMp GPU Backend |
||
real(kind=real32), | intent(inout), | target | :: | in(:) |
Send pointer |
|
real(kind=real32), | intent(inout), | target | :: | out(:) |
Recv pointer |
|
type(dtfft_stream_t), | intent(in) | :: | stream |
Main execution CUDA stream |
||
real(kind=real32), | intent(inout), | target | :: | aux(:) |
Aux pointer |
Destroys cuFFTMp GPU Backend
Type | Intent | Optional | Attributes | Name | ||
---|---|---|---|---|---|---|
class(backend_cufftmp), | intent(inout) | :: | self |
cuFFTMp GPU Backend |