Skip to content

Instantly share code, notes, and snippets.

@sklam
Created August 19, 2015 20:39
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save sklam/f62f1f48bb0be78f9ceb to your computer and use it in GitHub Desktop.
Save sklam/f62f1f48bb0be78f9ceb to your computer and use it in GitHub Desktop.
Test script for checking the NVVM bug
"""
Run with NUMBAPRO_NVVM set to the path of a different libnvvm library,
e.g. (on OSX)
NUMBAPRO_NVVM=/Developer/NVIDIA/CUDA-7.5/nvvm/lib/libnvvm.dylib python testnvvm.py
"""
from llvmlite import ir #, binding as llvm
from numba.cuda.cudadrv.nvvm import (llvm_to_ptx, set_cuda_kernel,
fix_data_layout)
# Build an LLVM module containing a single kernel: foo(i32* ptr, i32 ip_max).
m = ir.Module()
i32 = ir.IntType(32)
fn = ir.Function(m, ir.FunctionType(ir.VoidType(), [i32.as_pointer(), i32]),
                 "foo")
builder = ir.IRBuilder(fn.append_basic_block('entry'))
ptr, ip_max = fn.args
ptr.name = "ptr"
ip_max.name = "ip_max"

# Loop counter lives in a stack slot, initialised to zero.
ip_var = builder.alloca(i32)
builder.store(ir.Constant(i32, 0), ip_var)

# Loop head: increment the counter; continue while the pre-increment
# value is still below ip_max.
head_label = builder.append_basic_block('head')
builder.branch(head_label)
builder.position_at_end(head_label)
ip = builder.load(ip_var)
builder.store(builder.add(ip, ir.Constant(ip.type, 1)), ip_var)
pred_continue = builder.icmp_signed('<', ip, ip_max)
loop_label = builder.append_basic_block('loop')
end_label = builder.append_basic_block('end')
builder.cbranch(pred_continue, loop_label, end_label)

# Loop body:
builder.position_at_end(loop_label)
def insert_branch(expect):
    """Emit ``if ip == expect: ptr[ip] = ip; goto head`` and leave the
    builder positioned at the fall-through (endif) block.

    Closes over the module-level ``builder``, ``ip``, ``ptr`` and
    ``head_label``.
    """
    taken = builder.append_basic_block('if')
    fallthrough = builder.append_basic_block('endif')
    builder.cbranch(builder.icmp_signed('==', ip, expect), taken, fallthrough)
    # Then-branch: store the counter through the pointer, jump to loop head.
    builder.position_at_end(taken)
    builder.store(ip, builder.gep(ptr, [ip]))
    builder.branch(head_label)
    # Continue emitting after the conditional.
    builder.position_at_end(fallthrough)
# Emit 2000 sequential compare-and-store conditionals in the loop body;
# the large number of basic blocks is what exercises the NVVM bug.
for i in range(2000):
    insert_branch(ir.Constant(ir.IntType(32), i))
builder.branch(head_label)

# End block: the kernel simply returns.
builder.position_at_end(end_label)
builder.ret_void()

# llvm.view_function_cfg(fn)  # debug helper: visualise the CFG
set_cuda_kernel(fn)
fix_data_layout(m)
llvmir = str(m)
# splitlines() already returns a list — no need to wrap it in list().
print('line ct', len(llvmir.splitlines()))
ptx = llvm_to_ptx(llvmir)
print(ptx.decode('ascii'))
@gmarkall
Copy link

Just a note: to run this, I had to change m to be an llvmlite.llvmpy.core.Module, because only it has the get_or_insert_named_metadata function used by set_cuda_kernel. Is it likely that I've got something mismatched somewhere?

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment