dtfft_transpose_plan

This module describes transpose_plan class

Uses

Help

Graph Key

Nodes of different colours represent the following:

Solid arrows point from a submodule to the (sub)module which it is descended from. Dashed arrows point from a module or program unit to modules which it uses.
Where possible, edges connecting nodes are given different colours to make them easier to distinguish in large graphs.

Used by

Help

Graph Key

Nodes of different colours represent the following:

Solid arrows point from a submodule to the (sub)module which it is descended from. Dashed arrows point from a module or program unit to modules which it uses.
Where possible, edges connecting nodes are given different colours to make them easier to distinguish in large graphs.

Variables

Type	Visibility	Attributes		Name		Initial
integer(kind=int8),	private,	save	::	FORWARD_PLAN_IDS(3)			Default data types for forward transpositions
integer(kind=int8),	private,	save	::	BACKWARD_PLAN_IDS(3)			Default data types for backward transpositions
logical,	private,	save	::	ARE_DATATYPES_SET	=	.false.	Are default data types set

Derived Types

type, public, extends(reshape_plan_base) :: transpose_plan

Transpose Plan class This class is a container for transposition plans

Components

Type	Visibility	Attributes		Name
type(dtfft_backend_t),	public		::	backend	Backend
type(backend_helper),	public		::	helper	Backend helper
integer(kind=int64),	public		::	min_buffer_size	Minimal buffer size for transposition
type(dtfft_platform_t),	public		::	platform	Platform used for transposition
type(dtfft_stream_t),	public		::	stream	CUDA stream
type(reshape_container),	public,	allocatable	::	plans(:)	Plans for each reshape operation
type(string),	public,	allocatable	::	names(:)	Names of each reshape operation
logical,	private		::	is_z_slab	Is Z-slab optimization enabled
logical,	private		::	is_y_slab	Is Y-slab optimization enabled

Type-Bound Procedures

procedure, public, pass(self), non_overridable :: init
procedure, public, pass(self), non_overridable :: get_async_active
procedure, public, pass(self), non_overridable :: get_aux_bytes	../../ Returns auxiliary buffer size
procedure, public, pass(self), non_overridable :: is_aux_needed
procedure, public, pass(self), non_overridable :: get_backend	../../ Returns backend id
procedure, public, pass(self) :: destroy
procedure, public, pass(self), non_overridable :: execute
procedure, public, pass(self), non_overridable :: execute_end
procedure, public, pass(self), non_overridable :: mem_alloc
procedure, public, pass(self), non_overridable :: mem_free
procedure, public, non_overridable, pass(self) :: create	../../ Creates transpose plan
procedure, public, non_overridable, pass(self) :: get_z_slab	../../ Returns .true. if Z-slab optimization is enabled
procedure, public, non_overridable, pass(self) :: get_y_slab	../../ Returns .true. if Y-slab optimization is enabled

Functions

private function create(self, platform, dims, base_comm, effort, base_dtype, base_storage, cart_comm, comms, pencils, ipencil) result(error_code)

Creates transposition plan

Arguments

Type	Intent	Optional		Name
class(transpose_plan),	intent(inout)		::	self	Transposition class
type(dtfft_platform_t),	intent(in)		::	platform	Platform to create plan for
integer(kind=int32),	intent(in)		::	dims(:)	Global sizes of the transform requested
type(MPI_Comm),	intent(in)		::	base_comm	Base communicator
type(dtfft_effort_t),	intent(in)		::	effort	`dtFFT` planner type of effort
type(MPI_Datatype),	intent(in)		::	base_dtype	Base MPI_Datatype
integer(kind=int64),	intent(in)		::	base_storage	Number of bytes needed to store single element
type(MPI_Comm),	intent(out)		::	cart_comm	Cartesian communicator
type(MPI_Comm),	intent(out)		::	comms(:)	Array of 1d communicators
type(pencil),	intent(out)		::	pencils(:)	Data distributing meta
type(pencil_init),	intent(in),	optional	::	ipencil	Pencil passed by user

Return Value integer(kind=int32)

Error code

private pure function get_z_slab(self)

Returns .true. if Z-slab optimization is enabled

Arguments

Type	Intent	Optional	Attributes		Name
class(transpose_plan),	intent(in)			::	self	Transposition class

Return Value logical

private pure function get_y_slab(self)

Returns .true. if Y-slab optimization is enabled

Arguments

Type	Intent	Optional	Attributes		Name
class(transpose_plan),	intent(in)			::	self	Transposition class

Return Value logical

private function autotune_transpose_id(create_kwargs, buffer_size, helper, from, to, transpose_name_id, forward_id, backward_id) result(elapsed_time)

Creates forward and backward transpose plans for backend DTFFT_BACKEND_MPI_DATATYPE based on source and target data distributions and, executes them DTFFT_MEASURE_ITERS times ( 4 * DTFFT_MEASURE_ITERS iterations total ) + 4 * DTFFT_MEASURE_WARMUP_ITERS warmup iterations

Arguments

Type	Intent		Name
type(create_args),	intent(inout)	::	create_kwargs
integer(kind=int64),	intent(in)	::	buffer_size
type(backend_helper),	intent(inout)	::	helper	Backend helper
type(pencil),	intent(in)	::	from	Source meta
type(pencil),	intent(in)	::	to	Target meta
integer(kind=int8),	intent(in)	::	transpose_name_id	ID of transpose name (from -3 to 3, except 0)
integer(kind=int8),	intent(out)	::	forward_id	Best forward plan ID
integer(kind=int8),	intent(out)	::	backward_id	Best backward plan ID

Return Value real(kind=real32)

Elapsed time for best plans selected

private function get_plan_execution_time(create_kwargs, buffer_size, helper, from, to, datatype_id, transpose_name_id) result(elapsed_time)

Creates transpose plan for backend DTFFT_BACKEND_MPI_DATATYPE and executes it DTFFT_MEASURE_WARMUP_ITERS + DTFFT_MEASURE_ITERS times

Arguments

Type	Intent		Name
type(create_args),	intent(inout)	::	create_kwargs
integer(kind=int64),	intent(in)	::	buffer_size
type(backend_helper),	intent(inout)	::	helper	Backend helper
type(pencil),	intent(in)	::	from	Source meta
type(pencil),	intent(in)	::	to	Target meta
integer(kind=int8),	intent(in)	::	datatype_id	ID of transpose (1 or 2)
integer(kind=int8),	intent(in)	::	transpose_name_id	ID of transpose name (from -3 to 3, except 0)

Return Value real(kind=real32)

Execution time [ms]

Subroutines

private subroutine autotune_grid_decomposition(platform, dims, base_comm, effort, base_dtype, base_storage, stream, best_forward_ids, best_backward_ids, best_decomposition, backend, min_execution_time, best_backend)

Runs through all possible grid decompositions and selects the best one based on the lowest average execution time

Arguments

Type	Intent	Optional		Name
type(dtfft_platform_t),	intent(in)		::	platform	Platform to use
integer(kind=int32),	intent(in)		::	dims(:)	Global sizes of the transform requested
type(MPI_Comm),	intent(in)		::	base_comm	3D comm
type(dtfft_effort_t),	intent(in)		::	effort	How thoroughly `dtFFT` searches for the optimal plan
type(MPI_Datatype),	intent(in)		::	base_dtype	Base MPI_Datatype
integer(kind=int64),	intent(in)		::	base_storage	Number of bytes needed to store single element
type(dtfft_stream_t),	intent(in)		::	stream	Stream to use
integer(kind=int8),	intent(inout)		::	best_forward_ids(:)	Best Datatype ids for forward plan
integer(kind=int8),	intent(inout)		::	best_backward_ids(:)	Best Datatype ids for backward plan
integer(kind=int32),	intent(out)		::	best_decomposition(:)	Best decomposition found
type(dtfft_backend_t),	intent(in),	optional	::	backend	GPU Backend to test. Should be passed only when effort is `DTFFT_ESTIMATE` or `DTFFT_MEASURE`
real(kind=real32),	intent(out),	optional	::	min_execution_time	Elapsed time for best plan selected
type(dtfft_backend_t),	intent(out),	optional	::	best_backend	Best backend selected

private subroutine autotune_grid(platform, dims, base_comm, effort, base_dtype, comm_dims, base_storage, stream, is_z_slab, best_forward_ids, best_backward_ids, backend, best_time, best_backend)

Creates cartesian grid and runs various backends on it. Returns best backend and execution time

Arguments

Type	Intent	Optional		Name
type(dtfft_platform_t),	intent(in)		::	platform	Platform to create plan for
integer(kind=int32),	intent(in)		::	dims(:)	Global sizes of the transform requested
type(MPI_Comm),	intent(in)		::	base_comm	Basic communicator to create 3d grid from
type(dtfft_effort_t),	intent(in)		::	effort	How thoroughly `dtFFT` searches for the optimal plan
type(MPI_Datatype),	intent(in)		::	base_dtype	Base MPI_Datatype
integer(kind=int32),	intent(in)		::	comm_dims(:)	Number of processors in each dimension
integer(kind=int64),	intent(in)		::	base_storage	Number of bytes needed to store single element
type(dtfft_stream_t),	intent(in)		::	stream	Stream to use
logical,	intent(in)		::	is_z_slab	Is Z-slab optimization enabled
integer(kind=int8),	intent(inout)		::	best_forward_ids(:)	Best Datatype ids for forward plan
integer(kind=int8),	intent(inout)		::	best_backward_ids(:)	Best Datatype ids for backward plan
type(dtfft_backend_t),	intent(in),	optional	::	backend	GPU Backend to test. Should be passed only when effort is `DTFFT_ESTIMATE` or `DTFFT_MEASURE`
real(kind=real32),	intent(out),	optional	::	best_time	Elapsed time for best plan selected
type(dtfft_backend_t),	intent(out),	optional	::	best_backend	Best backend selected for the grid

private subroutine run_autotune_backend(platform, comms, cart_comm, effort, base_dtype, pencils, base_storage, stream, is_z_slab, best_forward_ids, best_backward_ids, backend, best_time, best_backend)

Runs autotune for all backends

Arguments

Type	Intent	Optional		Name
type(dtfft_platform_t),	intent(in)		::	platform	Platform to create plan for
type(MPI_Comm),	intent(in)		::	comms(:)	1D comms
type(MPI_Comm),	intent(in)		::	cart_comm	3D Cartesian comm
type(dtfft_effort_t),	intent(in)		::	effort
type(MPI_Datatype),	intent(in)		::	base_dtype	Base MPI_Datatype
type(pencil),	intent(in)		::	pencils(:)	Source meta
integer(kind=int64),	intent(in)		::	base_storage	Number of bytes needed to store single element
type(dtfft_stream_t),	intent(in)		::	stream	Stream to use
logical,	intent(in)		::	is_z_slab	Is Z-slab optimization enabled
integer(kind=int8),	intent(inout)		::	best_forward_ids(:)	Best Datatype ids for forward plan
integer(kind=int8),	intent(inout)		::	best_backward_ids(:)	Best Datatype ids for backward plan
type(dtfft_backend_t),	intent(in),	optional	::	backend	GPU Backend to test. Should be passed only when effort is `DTFFT_ESTIMATE` or `DTFFT_MEASURE`
real(kind=real32),	intent(out),	optional	::	best_time	Elapsed time for best backend
type(dtfft_backend_t),	intent(out),	optional	::	best_backend	Best backend selected

private subroutine run_autotune_datatypes(create_kwargs, buffer_size, helper, pencils, is_z_slab, best_forward_ids, best_backward_ids, elapsed_time)

Arguments

Type	Intent		Name
type(create_args),	intent(inout)	::	create_kwargs
integer(kind=int64),	intent(in)	::	buffer_size
type(backend_helper),	intent(inout)	::	helper	Base MPI_Datatype
type(pencil),	intent(in)	::	pencils(:)	Source meta
logical,	intent(in)	::	is_z_slab	Is Z-slab optimization enabled
integer(kind=int8),	intent(out)	::	best_forward_ids(:)	Best Datatype ids for forward plan
integer(kind=int8),	intent(out)	::	best_backward_ids(:)	Best Datatype ids for backward plan
real(kind=real32),	intent(out)	::	elapsed_time	Elapsed time for best plans selected in [ms]

private subroutine get_permutations(ndims, dperm, cperm)

Arguments

Type	Intent	Attributes		Name
integer(kind=int8),	intent(in)		::	ndims
integer(kind=int8),		allocatable	::	dperm(:,:)
integer(kind=int8),		allocatable	::	cperm(:,:)

private subroutine create_pencils_and_comm(dims, old_comm, comm_dims, comm, local_comms, pencils, ipencil)

Creates cartesian communicator

Arguments

Type	Intent	Optional		Name
integer(kind=int32),	intent(in)		::	dims(:)	Global dimensions
type(MPI_Comm),	intent(in)		::	old_comm	Communicator to create cartesian from
integer(kind=int32),	intent(in)		::	comm_dims(:)	Dims in cartesian communicator
type(MPI_Comm),	intent(out)		::	comm	Cartesian communicator
type(MPI_Comm),	intent(out)		::	local_comms(:)	1d communicators in cartesian communicator
type(pencil),	intent(out)		::	pencils(:)	Data distributing meta
type(pencil_init),	intent(in),	optional	::	ipencil	Pencil passed by user

private subroutine create_cart_comm(old_comm, comm_dims, comm, local_comms, ipencil)

Creates cartesian communicator

Arguments

Type	Intent	Optional		Name
type(MPI_Comm),	intent(in)		::	old_comm	Communicator to create cartesian from
integer(kind=int32),	intent(in)		::	comm_dims(:)	Dims in cartesian communicator
type(MPI_Comm),	intent(out)		::	comm	Cartesian communicator
type(MPI_Comm),	intent(out)		::	local_comms(:)	1d communicators in cartesian communicator
type(pencil_init),	intent(in),	optional	::	ipencil	Pencil passed by user

dtfft_transpose_plan Module

Contents

Variables

Derived Types

Functions

Subroutines

Uses

Used by

Variables

Derived Types

type, public, extends(reshape_plan_base) :: transpose_plan

Components

Type-Bound Procedures

Functions

private function create(self, platform, dims, base_comm, effort, base_dtype, base_storage, cart_comm, comms, pencils, ipencil) result(error_code)

Arguments

Return Value integer(kind=int32)

private pure function get_z_slab(self)

Arguments

Return Value logical

private pure function get_y_slab(self)

Arguments

Return Value logical

private function autotune_transpose_id(create_kwargs, buffer_size, helper, from, to, transpose_name_id, forward_id, backward_id) result(elapsed_time)

Arguments

Return Value real(kind=real32)

private function get_plan_execution_time(create_kwargs, buffer_size, helper, from, to, datatype_id, transpose_name_id) result(elapsed_time)

Arguments

Return Value real(kind=real32)

Subroutines

private subroutine autotune_grid_decomposition(platform, dims, base_comm, effort, base_dtype, base_storage, stream, best_forward_ids, best_backward_ids, best_decomposition, backend, min_execution_time, best_backend)

Arguments

private subroutine autotune_grid(platform, dims, base_comm, effort, base_dtype, comm_dims, base_storage, stream, is_z_slab, best_forward_ids, best_backward_ids, backend, best_time, best_backend)

Arguments

private subroutine run_autotune_backend(platform, comms, cart_comm, effort, base_dtype, pencils, base_storage, stream, is_z_slab, best_forward_ids, best_backward_ids, backend, best_time, best_backend)

Arguments

private subroutine run_autotune_datatypes(create_kwargs, buffer_size, helper, pencils, is_z_slab, best_forward_ids, best_backward_ids, elapsed_time)

Arguments

private subroutine get_permutations(ndims, dperm, cperm)

Arguments

private subroutine create_pencils_and_comm(dims, old_comm, comm_dims, comm, local_comms, pencils, ipencil)

Arguments

private subroutine create_cart_comm(old_comm, comm_dims, comm, local_comms, ipencil)

Arguments