cuLaunchKernel Function

public function cuLaunchKernel(func, in, out, blocks, threads, stream, kernelParams) result(cuResult)

Launches a CUDA kernel

Arguments

Type | Intent | Optional | Attributes | Name
type(CUfunction), intent(in) :: func

Function CUfunction or Kernel CUkernel to launch

type(c_ptr), intent(in), target :: in

Input pointer

type(c_ptr), intent(in), target :: out

Output pointer

type(dim3), intent(in) :: blocks

Grid dimensions, in blocks

type(dim3), intent(in) :: threads

Thread block dimensions, in threads

type(dtfft_stream_t), intent(in) :: stream

Stream identifier

type(kernelArgs), intent(in), target :: kernelParams

Input parameters passed to the kernel `func`

Return Value integer(kind=c_int)

Driver result code


Called by

Call graph (caller -> callee):

- nvrtc_kernel%execute -> cuLaunchKernel
- get_kernel -> cuLaunchKernel
- nvrtc_kernel%create -> get_kernel
- backend_mpi%execute_mpi -> nvrtc_kernel%execute
- backend_nccl%execute_nccl -> nvrtc_kernel%execute
- transpose_handle_cuda%execute -> nvrtc_kernel%execute
- abstract_backend%execute -> nvrtc_kernel%execute
- transpose_handle_cuda%create -> nvrtc_kernel%create
- transpose_plan_cuda%execute_cuda -> transpose_handle_cuda%execute
- run_autotune_backend -> transpose_handle_cuda%execute
- autotune_grid -> run_autotune_backend
- transpose_plan_cuda%create_cuda -> run_autotune_backend
- transpose_plan_cuda%create_cuda -> autotune_grid_decomposition
- autotune_grid_decomposition -> autotune_grid