ERROR: LoadError: TaskFailedException
Stacktrace:
[1] wait
@ ./task.jl:334 [inlined]
[2] fetch(t::Task)
@ Base ./task.jl:349
[3] top-level scope
@ ~/knightvision/piece_recognition/KnightVisionServer/test/test_cuda.jl:39
nested task error: CUDNNError: CUDNN_STATUS_INTERNAL_ERROR (code 4)
const LOCK = ReentrantLock()

# Serialize all GPU work behind a single lock so only one task at a time
# runs the network (`nn`, e.g. a Flux model) and copies the result back.
function inference(imgs)
    lock(LOCK)
    try
        out = nn(imgs)
        return maximum(cpu(out))
    finally
        unlock(LOCK)
    end
end
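
A minimal sketch of how this lock-guarded inference might be exercised from concurrent tasks, matching the fetch-over-tasks pattern in the stack traces above; the input shape, batch size, and task count here are assumptions, not taken from test_cuda.jl:

# Hypothetical driver (assumed shapes and counts): every task calls the
# locked inference, so the GPU is only entered by one task at a time.
imgs  = cu(randn(Float32, 32, 32, 3, 8))           # assumed batch of 8 RGB 32x32 images
tasks = [Threads.@spawn inference(imgs) for _ in 1:4]
@show fetch.(tasks)                                 # a failure surfaces as a TaskFailedException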
ERROR: LoadError: TaskFailedException
Stacktrace:
[1] wait
@ ./task.jl:334 [inlined]
[2] fetch(t::Task)
@ Base ./task.jl:349
[3] top-level scope
@ ~/knightvision/piece_recognition/KnightVisionServer/test/test_cuda.jl:46
nested task error: Out of GPU memory trying to allocate 13.184 MiB
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.103.01   Driver Version: 470.103.01   CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|===============================+======================+======================|
|   0  NVIDIA GeForce ...  Off  | 00000000:01:00.0 Off |                  N/A |
|  0%   43C    P8    10W / 250W |   2256MiB / 11175MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
using CUDA
import CUDA.CUDNN: cudnnConvolutionForward

# 5x5 convolution kernel with 3 input channels and 6 output channels
# (cu(...) puts it on the GPU as Float32)
const W1 = cu(randn(5,5,3,6))

function inference(imgs)
    out = cudnnConvolutionForward(W1, imgs)
    return maximum(Array(out))
end
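
A minimal usage sketch for this standalone-convolution variant, assuming a Float32 image batch whose channel count matches the 3 input channels of W1; the shapes below are assumptions:

# Hypothetical call (assumed input shape): 16 RGB 28x28 images on the GPU.
imgs = cu(randn(Float32, 28, 28, 3, 16))
println(inference(imgs))   # convolve with W1, copy back, and take the maximum on the CPU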