Skip to content

Instantly share code, notes, and snippets.

@seantalts
Last active April 24, 2019 20:54
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save seantalts/7f2f0b8b3bd8421fb60c57af4735dd79 to your computer and use it in GitHub Desktop.
Save seantalts/7f2f0b8b3bd8421fb60c57af4735dd79 to your computer and use it in GitHub Desktop.
#include <iostream>
#include <algorithm>
#include <iterator>
#include <array>
// #ifdef __APPLE__
// #include <OpenCL/cl.hpp>
// #else
#include <CL/cl.hpp>
// #endif
using namespace std;
using namespace cl;
// Computes n! iteratively. Any n <= 1 (including negative values) yields 1.
// The result is a plain int, so it is only meaningful while n! fits in an int.
int factorial(int n) {
  int product = 1;
  for (int k = n; k > 1; --k) {
    product *= k;
  }
  return product;
}
/* Queries the available OpenCL platforms and hands back the first one.
 * When none are reported, prints a diagnostic and terminates with exit code 1.
 */
Platform getPlatform() {
  std::vector<Platform> platforms;
  Platform::get(&platforms);
  if (platforms.empty()) {
    cout << "No platforms found. Check OpenCL installation!\n";
    exit(1);
  }
  return platforms.front();
}
/* Returns the device at index i on the given platform.
 * If display is true, every device found on the platform is printed first
 * (one "Device <index>: <name>" line per device).
 * Prints a diagnostic and exits with status 1 when the platform reports no
 * devices, or when i is not a valid index into the device list.
 */
Device getDevice(Platform platform, int i, bool display=false) {
  std::vector<Device> all_devices;
  platform.getDevices(CL_DEVICE_TYPE_ALL, &all_devices);
  if (all_devices.empty()) {
    cout << "No devices found. Check OpenCL installation!\n";
    exit(1);
  }
  // Keep the count as an int so it compares cleanly with the int indices below.
  const int device_count = static_cast<int>(all_devices.size());
  if (display) {
    for (int j = 0; j < device_count; ++j)
      printf("Device %d: %s\n", j, all_devices[j].getInfo<CL_DEVICE_NAME>().c_str());
  }
  // Indexing the vector with an invalid i would be undefined behaviour, so
  // reject it explicitly instead.
  if (i < 0 || i >= device_count) {
    cout << "Device index " << i << " is out of range; found "
         << device_count << " device(s).\n";
    exit(1);
  }
  return all_devices[i];
}
// Enqueues a non-blocking (CL_FALSE) write of the n ints starting at A into
// buf, at offset 0, on the given queue. eve receives the event for this write
// so that callers can wait on it or make later commands depend on it.
// The status code returned by the enqueue call is not inspected.
// NOTE(review): since the write is non-blocking, A presumably has to stay
// valid until eve completes - confirm against the OpenCL documentation.
void schedWrite(CommandQueue queue, cl::Buffer buf, int* A, int n, Event& eve) {
  const auto byte_count = sizeof(int) * n;
  queue.enqueueWriteBuffer(buf, CL_FALSE, /*offset=*/0, byte_count, A,
                           /*events=*/NULL, &eve);
}
// Same as a plain non-blocking buffer write of the n ints at A into buf, except
// that the command is enqueued with eve2 as its single wait-list entry.
// eve receives the event for this write. The status code returned by the
// enqueue call is not inspected.
void schedWriteEvents(CommandQueue queue, cl::Buffer buf, int* A, int n, Event& eve, Event eve2) {
  // Wait list holding exactly one event: eve2.
  const std::vector<cl::Event> wait_list(1, eve2);
  const auto byte_count = sizeof(int) * n;
  queue.enqueueWriteBuffer(buf, CL_FALSE, 0, byte_count, A, &wait_list, &eve);
}
int main() {
constexpr int n = 1024*1024; // size of vectors
constexpr int c_max = 5; // max value to iterate to
const int coeff = factorial(c_max);
// A is initial, B is result, C is expected result
vector<int> A(n), B(n), C(n);
for (int i=0; i<n; i++) {
A[i] = i;
C[i] = coeff * i;
}
Platform default_platform = getPlatform();
Device default_device = getDevice(default_platform, 1);
Context context({default_device});
Program::Sources sources;
std::string kernel_code=
"void kernel multiply_by(global int* A, const int c) {"
" A[get_global_id(0)] = c * A[get_global_id(0)];"
"}";
sources.push_back({kernel_code.c_str(), kernel_code.length()});
Program program(context, sources);
if (program.build({default_device}) != CL_SUCCESS) {
cout << "Error building: " << program.getBuildInfo<CL_PROGRAM_BUILD_LOG>(default_device) << std::endl;
exit(1);
}
Buffer buffer_A(context, CL_MEM_READ_WRITE, sizeof(int) * n);
CommandQueue queue(context, default_device);
Event eve1;
vector<Event> events;
schedWrite(queue, buffer_A, A.data(), n, eve1);
Event eve2;
schedWriteEvents(queue, buffer_A, A.data(), n, eve2, eve1);
queue.flush();
Kernel multiply_by = Kernel(program, "multiply_by");
eve2.wait();
multiply_by.setArg(0, buffer_A);
for (int c=2; c<=c_max; c++) {
multiply_by.setArg(1, c);
queue.enqueueNDRangeKernel(multiply_by, NullRange, NDRange(n), NDRange(32));
}
queue.enqueueReadBuffer(buffer_A, CL_TRUE, 0, sizeof(int)*n, B.data());
if (std::equal(std::begin(B), std::end(B), std::begin(C)))
cout << "Arrays are equal!" << endl;
else
cout << "Uh-oh, the arrays aren't equal!" << endl;
return 0;
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment