1 2 3
kernel void matrixTranspose( global float *a, global float *b, constant float *c, constant int size ){ int idx = get_global_id(0);
/********************************************************************* sample.cu * This is an example of a CUDA program.