rfc1459/gist:7a68e021d39b6f40e8df

## gistfile1.txt
$ docker build -t device_query samples/deviceQuery
Sending build context to Docker daemon 2.048 kB
Step 1 : FROM cuda:latest
 ---> 24b36fe1abbc
Step 2 : WORKDIR /usr/local/cuda/samples/1_Utilities/deviceQuery
 ---> Running in f8c0bfb5333e
 ---> 9951d503fd02
Removing intermediate container f8c0bfb5333e
Step 3 : RUN make
 ---> Running in 974ed5a27cda
/usr/local/cuda-7.5/bin/nvcc -ccbin g++ -I../../common/inc  -m64    -gencode arch=compute_20,code=sm_20 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_52,code=compute_52 -o deviceQuery.o -c deviceQuery.cpp
/usr/local/cuda-7.5/bin/nvcc -ccbin g++   -m64      -gencode arch=compute_20,code=sm_20 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_52,code=compute_52 -o deviceQuery deviceQuery.o
mkdir -p ../../bin/x86_64/linux/release
cp deviceQuery ../../bin/x86_64/linux/release
 ---> dbcd001f1416
Removing intermediate container 974ed5a27cda
Step 4 : CMD ./deviceQuery
 ---> Running in 6e669de169e2
 ---> 6de3092faf4d
Removing intermediate container 6e669de169e2
Successfully built 6de3092faf4d
$ GPU=0 ./nvidia-docker run --rm device_query
[ NVIDIA ] =INFO= Driver version: 352.55
[ NVIDIA ] =INFO= CUDA image version: 7.5

./deviceQuery Starting...

 CUDA Device Query (Runtime API) version (CUDART static linking)

Detected 1 CUDA Capable device(s)

Device 0: "GeForce GTX 650 Ti"
  CUDA Driver Version / Runtime Version          7.5 / 7.5
  CUDA Capability Major/Minor version number:    3.0
  Total amount of global memory:                 2047 MBytes (2146762752 bytes)
  ( 4) Multiprocessors, (192) CUDA Cores/MP:     768 CUDA Cores
  GPU Max Clock rate:                            928 MHz (0.93 GHz)
  Memory Clock rate:                             2700 Mhz
  Memory Bus Width:                              128-bit
  L2 Cache Size:                                 262144 bytes
  Maximum Texture Dimension Size (x,y,z)         1D=(65536), 2D=(65536, 65536), 3D=(4096, 4096, 4096)
  Maximum Layered 1D Texture Size, (num) layers  1D=(16384), 2048 layers
  Maximum Layered 2D Texture Size, (num) layers  2D=(16384, 16384), 2048 layers
  Total amount of constant memory:               65536 bytes
  Total amount of shared memory per block:       49152 bytes
  Total number of registers available per block: 65536
  Warp size:                                     32
  Maximum number of threads per multiprocessor:  2048
  Maximum number of threads per block:           1024
  Max dimension size of a thread block (x,y,z): (1024, 1024, 64)
  Max dimension size of a grid size    (x,y,z): (2147483647, 65535, 65535)
  Maximum memory pitch:                          2147483647 bytes
  Texture alignment:                             512 bytes
  Concurrent copy and kernel execution:          Yes with 1 copy engine(s)
  Run time limit on kernels:                     Yes
  Integrated GPU sharing Host Memory:            No
  Support host page-locked memory mapping:       Yes
  Alignment requirement for Surfaces:            Yes
  Device has ECC support:                        Disabled
  Device supports Unified Addressing (UVA):      Yes
  Device PCI Domain ID / Bus ID / location ID:   0 / 2 / 0
  Compute Mode:
     < Default (multiple host threads can use ::cudaSetDevice() with device simultaneously) >

deviceQuery, CUDA Driver = CUDART, CUDA Driver Version = 7.5, CUDA Runtime Version = 7.5, NumDevs = 1, Device0 = GeForce GTX 650 Ti
Result = PASS
	$ docker build -t device_query samples/deviceQuery
	Sending build context to Docker daemon 2.048 kB
	Step 1 : FROM cuda:latest
	---> 24b36fe1abbc
	Step 2 : WORKDIR /usr/local/cuda/samples/1_Utilities/deviceQuery
	---> Running in f8c0bfb5333e
	---> 9951d503fd02
	Removing intermediate container f8c0bfb5333e
	Step 3 : RUN make
	---> Running in 974ed5a27cda
	/usr/local/cuda-7.5/bin/nvcc -ccbin g++ -I../../common/inc -m64 -gencode arch=compute_20,code=sm_20 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_52,code=compute_52 -o deviceQuery.o -c deviceQuery.cpp
	/usr/local/cuda-7.5/bin/nvcc -ccbin g++ -m64 -gencode arch=compute_20,code=sm_20 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_52,code=compute_52 -o deviceQuery deviceQuery.o
	mkdir -p ../../bin/x86_64/linux/release
	cp deviceQuery ../../bin/x86_64/linux/release
	---> dbcd001f1416
	Removing intermediate container 974ed5a27cda
	Step 4 : CMD ./deviceQuery
	---> Running in 6e669de169e2
	---> 6de3092faf4d
	Removing intermediate container 6e669de169e2
	Successfully built 6de3092faf4d
	$ GPU=0 ./nvidia-docker run --rm device_query
	[ NVIDIA ] =INFO= Driver version: 352.55
	[ NVIDIA ] =INFO= CUDA image version: 7.5

	./deviceQuery Starting...

	CUDA Device Query (Runtime API) version (CUDART static linking)

	Detected 1 CUDA Capable device(s)

	Device 0: "GeForce GTX 650 Ti"
	  CUDA Driver Version / Runtime Version          7.5 / 7.5
	  CUDA Capability Major/Minor version number:    3.0
	  Total amount of global memory:                 2047 MBytes (2146762752 bytes)
	  ( 4) Multiprocessors, (192) CUDA Cores/MP:     768 CUDA Cores
	  GPU Max Clock rate:                            928 MHz (0.93 GHz)
	  Memory Clock rate:                             2700 Mhz
	  Memory Bus Width:                              128-bit
	  L2 Cache Size:                                 262144 bytes
	  Maximum Texture Dimension Size (x,y,z)         1D=(65536), 2D=(65536, 65536), 3D=(4096, 4096, 4096)
	  Maximum Layered 1D Texture Size, (num) layers  1D=(16384), 2048 layers
	  Maximum Layered 2D Texture Size, (num) layers  2D=(16384, 16384), 2048 layers
	  Total amount of constant memory:               65536 bytes
	  Total amount of shared memory per block:       49152 bytes
	  Total number of registers available per block: 65536
	  Warp size:                                     32
	  Maximum number of threads per multiprocessor:  2048
	  Maximum number of threads per block:           1024
	  Max dimension size of a thread block (x,y,z): (1024, 1024, 64)
	  Max dimension size of a grid size    (x,y,z): (2147483647, 65535, 65535)
	  Maximum memory pitch:                          2147483647 bytes
	  Texture alignment:                             512 bytes
	  Concurrent copy and kernel execution:          Yes with 1 copy engine(s)
	  Run time limit on kernels:                     Yes
	  Integrated GPU sharing Host Memory:            No
	  Support host page-locked memory mapping:       Yes
	  Alignment requirement for Surfaces:            Yes
	  Device has ECC support:                        Disabled
	  Device supports Unified Addressing (UVA):      Yes
	  Device PCI Domain ID / Bus ID / location ID:   0 / 2 / 0
	  Compute Mode:
	     < Default (multiple host threads can use ::cudaSetDevice() with device simultaneously) >

	deviceQuery, CUDA Driver = CUDART, CUDA Driver Version = 7.5, CUDA Runtime Version = 7.5, NumDevs = 1, Device0 = GeForce GTX 650 Ti
	Result = PASS