GPU device properties obtained from the CUDA runtime's cudaDeviceProp structure.
Type | Visibility | Attributes | Name | Initial | |||
---|---|---|---|---|---|---|---|
integer(kind=c_int), | public | :: | sm_count |
Number of multiprocessors on device (cudaDeviceProp.multiProcessorCount) |
|||
integer(kind=c_int), | public | :: | max_threads_per_sm |
Maximum number of resident threads per multiprocessor (cudaDeviceProp.maxThreadsPerMultiProcessor) |
|||
integer(kind=c_int), | public | :: | max_blocks_per_sm |
Maximum number of resident blocks per multiprocessor (cudaDeviceProp.maxBlocksPerMultiProcessor) |
|||
integer(kind=c_size_t), | public | :: | shared_mem_per_sm |
Shared memory available per multiprocessor in bytes (cudaDeviceProp.sharedMemPerMultiprocessor) |
|||
integer(kind=c_int), | public | :: | max_threads_per_block |
Maximum number of threads per block (cudaDeviceProp.maxThreadsPerBlock) |
|||
integer(kind=c_size_t), | public | :: | shared_mem_per_block |
Shared memory available per block in bytes (cudaDeviceProp.sharedMemPerBlock) |
|||
integer(kind=c_int), | public | :: | l2_cache_size |
Size of L2 cache in bytes (cudaDeviceProp.l2CacheSize) |
|||
integer(kind=c_int), | public | :: | compute_capability_major |
Major compute capability (cudaDeviceProp.major) |
|||
integer(kind=c_int), | public | :: | compute_capability_minor |
Minor compute capability (cudaDeviceProp.minor) |