qfgaohao/device_properties.cu

## device_properties.cu
#include <stdio.h>


/*
 * Print a report of every CUDA device reported by cudaGetDeviceCount().
 *
 * For each device the report lists identification (name, compute capability),
 * per-SM resources, memory sizes/clocks, and the block/grid launch limits,
 * all taken from the cudaDeviceProp structure filled in by
 * cudaGetDeviceProperties().
 *
 * Errors from the CUDA runtime are reported on stderr:
 *   - if the device count cannot be obtained, nothing else is printed;
 *   - if the properties of one device cannot be read, that device is skipped
 *     and the remaining devices are still reported.
 */
void deviceQuery ()
{
  int nDevices = 0;
  cudaError_t ierr = cudaGetDeviceCount(&nDevices);
  if (ierr != cudaSuccess)
  {
     fprintf(stderr, "cudaGetDeviceCount failed: %s\n", cudaGetErrorString(ierr));
     return;
  }

  if (nDevices == 0)
  {
     printf("No CUDA devices found\n");
     return;
  }

  for (int i = 0; i < nDevices; ++i)
  {
     cudaDeviceProp prop;

     /* Never print from `prop` unless the query succeeded: on failure the
        structure is not guaranteed to hold meaningful values. */
     ierr = cudaGetDeviceProperties(&prop, i);
     if (ierr != cudaSuccess)
     {
        fprintf(stderr, "cudaGetDeviceProperties failed for device %d: %s\n",
                i, cudaGetErrorString(ierr));
        continue;
     }

     printf("Device number: %d\n", i);
     printf("  Device name: %s\n", prop.name);
     printf("  Compute capability: %d.%d\n\n", prop.major, prop.minor);

     /* Per-SM resources and memory. The size_t fields use %zu so the output
        is correct on platforms where unsigned long is narrower than size_t. */
     printf("  Clock Rate: %d kHz\n", prop.clockRate);
     printf("  Total SMs: %d \n", prop.multiProcessorCount);
     printf("  Shared Memory Per SM: %zu bytes\n", prop.sharedMemPerMultiprocessor);
     printf("  Registers Per SM: %d 32-bit\n", prop.regsPerMultiprocessor);
     printf("  Max threads per SM: %d\n", prop.maxThreadsPerMultiProcessor);
     printf("  L2 Cache Size: %d bytes\n", prop.l2CacheSize);
     printf("  Total Global Memory: %zu bytes\n", prop.totalGlobalMem);
     printf("  Memory Clock Rate: %d kHz\n\n", prop.memoryClockRate);

     /* Block-level launch limits. */
     printf("  Max threads per block: %d\n", prop.maxThreadsPerBlock);
     printf("  Max threads in X-dimension of block: %d\n", prop.maxThreadsDim[0]);
     printf("  Max threads in Y-dimension of block: %d\n", prop.maxThreadsDim[1]);
     printf("  Max threads in Z-dimension of block: %d\n\n", prop.maxThreadsDim[2]);

     /* Grid-level launch limits. */
     printf("  Max blocks in X-dimension of grid: %d\n", prop.maxGridSize[0]);
     printf("  Max blocks in Y-dimension of grid: %d\n", prop.maxGridSize[1]);
     printf("  Max blocks in Z-dimension of grid: %d\n\n", prop.maxGridSize[2]);

     /* Per-block resources. */
     printf("  Shared Memory Per Block: %zu bytes\n", prop.sharedMemPerBlock);
     printf("  Registers Per Block: %d 32-bit\n", prop.regsPerBlock);
     printf("  Warp size: %d\n\n", prop.warpSize);
  }
}

/* Program entry point: print the device report and exit with status 0. */
int main()
{
    deviceQuery();
    return 0;
}
	#include <stdio.h>


	/*
	 * Print a report of every CUDA device reported by cudaGetDeviceCount().
	 *
	 * For each device the report lists identification (name, compute
	 * capability), per-SM resources, memory sizes/clocks, and the block/grid
	 * launch limits, all taken from the cudaDeviceProp structure filled in by
	 * cudaGetDeviceProperties().
	 *
	 * Errors from the CUDA runtime are reported on stderr:
	 *   - if the device count cannot be obtained, nothing else is printed;
	 *   - if the properties of one device cannot be read, that device is
	 *     skipped and the remaining devices are still reported.
	 */
	void deviceQuery ()
	{
		int nDevices = 0;
		cudaError_t ierr = cudaGetDeviceCount(&nDevices);
		if (ierr != cudaSuccess)
		{
			fprintf(stderr, "cudaGetDeviceCount failed: %s\n", cudaGetErrorString(ierr));
			return;
		}

		if (nDevices == 0)
		{
			printf("No CUDA devices found\n");
			return;
		}

		for (int i = 0; i < nDevices; ++i)
		{
			cudaDeviceProp prop;

			/* Never print from `prop` unless the query succeeded: on failure
			   the structure is not guaranteed to hold meaningful values. */
			ierr = cudaGetDeviceProperties(&prop, i);
			if (ierr != cudaSuccess)
			{
				fprintf(stderr, "cudaGetDeviceProperties failed for device %d: %s\n",
				        i, cudaGetErrorString(ierr));
				continue;
			}

			printf("Device number: %d\n", i);
			printf(" Device name: %s\n", prop.name);
			printf(" Compute capability: %d.%d\n\n", prop.major, prop.minor);

			/* Per-SM resources and memory. The size_t fields use %zu so the
			   output is correct on platforms where unsigned long is narrower
			   than size_t. */
			printf(" Clock Rate: %d kHz\n", prop.clockRate);
			printf(" Total SMs: %d \n", prop.multiProcessorCount);
			printf(" Shared Memory Per SM: %zu bytes\n", prop.sharedMemPerMultiprocessor);
			printf(" Registers Per SM: %d 32-bit\n", prop.regsPerMultiprocessor);
			printf(" Max threads per SM: %d\n", prop.maxThreadsPerMultiProcessor);
			printf(" L2 Cache Size: %d bytes\n", prop.l2CacheSize);
			printf(" Total Global Memory: %zu bytes\n", prop.totalGlobalMem);
			printf(" Memory Clock Rate: %d kHz\n\n", prop.memoryClockRate);

			/* Block-level launch limits. */
			printf(" Max threads per block: %d\n", prop.maxThreadsPerBlock);
			printf(" Max threads in X-dimension of block: %d\n", prop.maxThreadsDim[0]);
			printf(" Max threads in Y-dimension of block: %d\n", prop.maxThreadsDim[1]);
			printf(" Max threads in Z-dimension of block: %d\n\n", prop.maxThreadsDim[2]);

			/* Grid-level launch limits. */
			printf(" Max blocks in X-dimension of grid: %d\n", prop.maxGridSize[0]);
			printf(" Max blocks in Y-dimension of grid: %d\n", prop.maxGridSize[1]);
			printf(" Max blocks in Z-dimension of grid: %d\n\n", prop.maxGridSize[2]);

			/* Per-block resources. */
			printf(" Shared Memory Per Block: %zu bytes\n", prop.sharedMemPerBlock);
			printf(" Registers Per Block: %d 32-bit\n", prop.regsPerBlock);
			printf(" Warp size: %d\n\n", prop.warpSize);
		}
	}

	/* Program entry point: print the device report and exit with status 0. */
	int main()
	{
		deviceQuery();
		return 0;
	}