Created
November 1, 2014 21:39
-
-
Save Jasper-Bekkers/43e2438d20f54839e706 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import pyopencl as cl | |
import numpy as np | |
import random as r | |
import datetime as date | |
np.set_printoptions(threshold=np.nan) | |
#Averages ~250.000,000 CGoL cell updates a second, 1GB NVIDIA 560ti | |
# x*y*iterations = total = gpu time = cells/sec | |
# 36*36*100000 = 129600000 = 27s = 4,800,000 | |
# 1000*1000*1000 = 1000000000 = 3.82s = 261,780,104 | |
# 1000*1000*5000 = 5000000000 = 18.82 = 265,674,814 | |
class CL: | |
def __init__(self): | |
platform = cl.get_platforms() | |
my_gpu_devices = platform[1].get_devices(device_type=cl.device_type.GPU) | |
self.ctx = cl.Context(devices=my_gpu_devices) | |
self.queue = cl.CommandQueue(self.ctx) | |
self.tick = False | |
np.random.seed(1) | |
def loadProgram(self, filename): | |
#read in the OpenCL source file as a string | |
f = open(filename, 'r') | |
fstr = "".join(f.readlines()) | |
#print fstr | |
#create the program | |
self.program = cl.Program(self.ctx, fstr).build() | |
#Create the host structures and buffers | |
def popCorn(self): | |
mf = cl.mem_flags | |
#initialize client side (CPU) arrays | |
#Use ar_ySize to increase the worldspace | |
self.ar_ySize = np.int32(36) | |
self.a = np.ones((self.ar_ySize,self.ar_ySize), dtype=np.int32) | |
self.c = np.ones((self.ar_ySize,self.ar_ySize), dtype=np.int32) | |
#create OpenCL buffers | |
self.a_buf = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.a) | |
self.dest_buf = cl.Buffer(self.ctx, mf.WRITE_ONLY, self.a.nbytes) | |
#Run Kernel, create buffer, fill buffer | |
def execute(self): | |
if not self.tick: | |
self.program.Conway(self.queue, self.a.shape, None, self.ar_ySize, self.a_buf, self.dest_buf) | |
else: | |
self.program.Conway(self.queue, self.a.shape, None, self.ar_ySize, self.dest_buf, self.a_buf) | |
self.tick = not self.tick | |
#Run Kernel, create buffer, fill buffer | |
def seed(self): | |
self.c = np.int32(np.random.randint(2, size=(self.ar_ySize, self.ar_ySize))) | |
self.a = self.c | |
#Refresh buffers | |
mf = cl.mem_flags | |
self.a_buf = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.a) | |
self.dest_buf = cl.Buffer(self.ctx, mf.WRITE_ONLY, self.a.nbytes) | |
#Print the output array | |
def render(self): | |
if self.tick: | |
cl.enqueue_read_buffer(self.queue, self.dest_buf, self.a).wait() | |
else: | |
cl.enqueue_read_buffer(self.queue, self.a_buf, self.a).wait() | |
print(self.a) | |
if __name__ == "__main__": | |
example = CL() | |
example.loadProgram("kTest.cl") | |
example.popCorn() | |
print("Begin CPU Seed:", date.datetime.now()) | |
example.seed() | |
print("Begin GPU Loop:", date.datetime.now()) | |
for i in range(50000): | |
example.execute() | |
print("Begin CPU Render:", date.datetime.now()) | |
example.render() | |
print("Done", date.datetime.now()) | |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment