autotune_grid_decomposition Subroutine

private subroutine autotune_grid_decomposition(self, dims, transposed_dims, base_comm, effort, n_transpose_plans, base_dtype, base_storage, best_comm_dims, best_forward_ids, best_backward_ids)

Runs through all possible grid decompositions and selects the one with the lowest average execution time.

Type Bound

transpose_plan_host

Arguments

Type | Intent | Optional | Attributes | Name
class(transpose_plan_host), intent(in) :: self

Abstract plan

integer(kind=int32), intent(in) :: dims(:)

Global dims

integer(kind=int32), intent(in) :: transposed_dims(:,:)

Transposed dims

type(MPI_Comm), intent(in) :: base_comm

Base communicator

type(dtfft_effort_t), intent(in) :: effort

How thoroughly dtFFT searches for the optimal plan

integer(kind=int8), intent(in) :: n_transpose_plans

Number of transpose plans to test

type(MPI_Datatype), intent(in) :: base_dtype

Base MPI_Datatype

integer(kind=int64), intent(in) :: base_storage

Number of bytes needed to store a single element

integer(kind=int32), intent(out) :: best_comm_dims(:)

Best communicator dimensions

integer(kind=int8), intent(inout) :: best_forward_ids(:)

Best Datatype ids for forward plan

integer(kind=int8), intent(inout) :: best_backward_ids(:)

Best Datatype ids for backward plan


Calls

Call graph (caller → callees):

- transpose_plan_host%autotune_grid_decomposition → to_str, mpi_comm_size, transpose_plan_host%autotune_grid, get_conf_log_enabled, write_message
- to_str → double_to_string, float_to_string, int32_to_string, int64_to_string, int8_to_string
- transpose_plan_host%autotune_grid → to_str, get_conf_log_enabled, write_message, mpi_comm_free, transpose_plan_host%autotune_mpi_datatypes, create_pencils_and_comm, pencil%destroy, get_local_sizes, transpose_plan_host%get_plan_execution_time, pop_nvtx_domain_range, push_nvtx_domain_range
- get_conf_log_enabled → get_conf_internal
- write_message → mpi_comm_rank, mpi_finalized
- get_conf_internal → get_conf_internal_int32, get_conf_internal_logical
- transpose_plan_host%autotune_mpi_datatypes → transpose_plan_host%autotune_transpose_id
- create_pencils_and_comm → lcounts, lstarts, pencil%create, create_cart_comm
- transpose_plan_host%get_plan_execution_time → to_str, mpi_comm_size, get_conf_log_enabled, write_message, pop_nvtx_domain_range, push_nvtx_domain_range, mpi_allreduce, mpi_wtime, transpose_handle_host%create, transpose_handle_host%destroy, transpose_handle_host%execute, get_conf_measure_iters, get_conf_measure_warmup_iters
- pop_nvtx_domain_range → nvtxDomainRangePop_c
- push_nvtx_domain_range → nvtxDomainRangePushEx_c, astring_f2c, create_nvtx_domain
- astring_f2c → string_f2c
- transpose_plan_host%autotune_transpose_id → transpose_plan_host%get_plan_execution_time
- pencil%create → pencil%destroy, check_if_even, get_local_size
- create_cart_comm → mpi_cart_create, mpi_cart_sub, mpi_comm_dup
- create_nvtx_domain → astring_f2c, nvtxDomainCreate_c
- transpose_handle_host%create → mpi_comm_size, mpi_allgather, handle_t%create_handle, transpose_handle_host%create_transpose_2d, transpose_handle_host%create_transpose_XY, transpose_handle_host%create_transpose_XZ, transpose_handle_host%create_transpose_YZ, transpose_handle_host%create_transpose_ZX, get_transpose_type
- transpose_handle_host%destroy → mpi_request_free, handle_t%destroy_handle
- transpose_handle_host%execute → mpi_alltoall_init, mpi_alltoallw_init, mpi_start, mpi_wait
- get_conf_measure_iters → get_conf_internal
- get_conf_measure_warmup_iters → get_conf_internal
- check_if_even → mpi_comm_size, mpi_allgather
- handle_t%create_handle → handle_t%destroy_handle
- transpose_handle_host%create_transpose_2d → mpi_type_commit, mpi_type_contiguous, mpi_type_create_resized, mpi_type_vector, free_datatypes
- transpose_handle_host%create_transpose_XY → mpi_type_commit, mpi_type_contiguous, mpi_type_create_hvector, mpi_type_create_resized, mpi_type_vector, free_datatypes
- transpose_handle_host%create_transpose_XZ → mpi_type_commit, mpi_type_contiguous, mpi_type_create_hvector, mpi_type_create_resized, mpi_type_vector, free_datatypes
- transpose_handle_host%create_transpose_YZ → mpi_type_commit, mpi_type_contiguous, mpi_type_create_hvector, mpi_type_create_resized, mpi_type_vector, free_datatypes
- transpose_handle_host%create_transpose_ZX → mpi_type_commit, mpi_type_contiguous, mpi_type_create_hvector, mpi_type_create_resized, mpi_type_vector, free_datatypes
- handle_t%destroy_handle → mpi_type_free
- get_local_size → mpi_comm_size, mpi_comm_rank, mpi_allgather
- free_datatypes → mpi_type_free

Called by

Called-by graph (caller → callee):

- transpose_plan_host%create_private → transpose_plan_host%autotune_grid_decomposition