Allan MacKinnon allanmac

## cub_sort.cu
//
// Build:
//
// nvcc -lcurand --generate-code arch=compute_50,code=compute_50 --generate-code arch=compute_75,code=compute_75 -D CUB_SORT_TYPE=uint32_t -o sort_cub_32 cub_sort.cu
// nvcc -lcurand --generate-code arch=compute_50,code=compute_50 --generate-code arch=compute_75,code=compute_75 -D CUB_SORT_TYPE=uint64_t -o sort_cub_64 cub_sort.cu
//

#define THRUST_IGNORE_CUB_VERSION_CHECK

#include <curand.h>

## sort.cu
// -*- compile-command: "nvcc -I ../cub-1.8.0 -lcurand -arch sm_50 -o sort sort.cu"; -*-

#include <curand.h>
#include <cub/cub.cuh>

//
//
//

#include <stdbool.h>

## warp_scan.cu

#include <stdio.h>
#include <stdint.h>

#define WARP_SIZE 32

//
//
//

## README.md

      
              3 files
            
          
              1 fork
            
          
              0 comments
            
          
              5 stars
            
          
                allanmac
                / README.md
            
            
              Last active
              June 10, 2023 11:11
            
              
                Macros for neatly error checking OpenCL API functions. 
              
          
Simply adding two parentheses, `cl(...)`, gives you error checking for OpenCL API functions that return a `cl_int` error code.
The second macro, `cl_ok(err)`, is for error checking API functions that return their error code through an argument.
The header also includes a useful function for converting OpenCL errors to strings:
`char const * clGetErrorString(cl_int const err);`


## unit16v2.cu
// -*- compile-command: "nvcc -arch sm_50 -Xptxas=-v -use_fast_math unit16v2.cu -o unit16v2"; -*-

#include <stdio.h>
#include <stdint.h>

//
//
//

#define WARP_SIZE                           32

## ck_2.cu
/*
 * Copyright 1993-2015 NVIDIA Corporation.  All rights reserved.
 *
 * Please refer to the NVIDIA end user license agreement (EULA) associated
 * with this source code for terms and conditions that govern your use of
 * this software. Any use, reproduction, disclosure, or distribution of
 * this software and related documentation outside the terms of the EULA
 * is strictly prohibited.
 *
 */

## alpha_gamma_test.svg

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                allanmac
                / alpha_gamma_test.svg
            
            
              Last active
              February 22, 2016 02:31
            
              
                See here: http://www.realtimerendering.com/blog/a-png-puzzle/
              
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## sort.cu
// -*- compile-command: "nvcc -D THRUST_SORT_TYPE=uint32_t -arch sm_50 -o sort sort_32.cu"; -*-

#include <thrust/host_vector.h>
#include <thrust/device_vector.h>
#include <thrust/generate.h>
#include <thrust/sort.h>
#include <thrust/copy.h>
#include <algorithm>
#include <cstdlib>

## probe_bw.cu
// -*- compile-command: "nvcc -m 64 -arch compute_30 -Xptxas=-v -o probe_bw probe_bw.cu"; -*-

//
// Copyright 2015 Allan MacKinnon <allanmac@alum.mit.edu>
//
// Permission is hereby granted, free of charge, to any person obtaining
// a copy of this software and associated documentation files (the
// "Software"), to deal in the Software without restriction, including
// without limitation the rights to use, copy, modify, merge, publish,
// distribute, sublicense, and/or sell copies of the Software, and to

## assert_cuda.c
//
//
//

#include <stdlib.h>
#include <stdio.h>

//
//
//
	//
	// Build:
	//
	// nvcc -lcurand --generate-code arch=compute_50,code=compute_50 --generate-code arch=compute_75,code=compute_75 -D CUB_SORT_TYPE=uint32_t -o sort_cub_32 cub_sort.cu
	// nvcc -lcurand --generate-code arch=compute_50,code=compute_50 --generate-code arch=compute_75,code=compute_75 -D CUB_SORT_TYPE=uint64_t -o sort_cub_64 cub_sort.cu
	//

	#define THRUST_IGNORE_CUB_VERSION_CHECK

	#include <curand.h>
	// -*- compile-command: "nvcc -I ../cub-1.8.0 -lcurand -arch sm_50 -o sort sort.cu"; -*-

	#include <curand.h>
	#include <cub/cub.cuh>

	//
	//
	//

	#include <stdbool.h>

	#include <stdio.h>
	#include <stdint.h>

	#define WARP_SIZE 32

	//
	//
	//
	// -*- compile-command: "nvcc -arch sm_50 -Xptxas=-v -use_fast_math unit16v2.cu -o unit16v2"; -*-

	#include <stdio.h>
	#include <stdint.h>

	//
	//
	//

	#define WARP_SIZE 32
	/*
	* Copyright 1993-2015 NVIDIA Corporation. All rights reserved.
	*
	* Please refer to the NVIDIA end user license agreement (EULA) associated
	* with this source code for terms and conditions that govern your use of
	* this software. Any use, reproduction, disclosure, or distribution of
	* this software and related documentation outside the terms of the EULA
	* is strictly prohibited.
	*
	*/
	// -*- compile-command: "nvcc -D THRUST_SORT_TYPE=uint32_t -arch sm_50 -o sort sort_32.cu"; -*-

	#include <thrust/host_vector.h>
	#include <thrust/device_vector.h>
	#include <thrust/generate.h>
	#include <thrust/sort.h>
	#include <thrust/copy.h>
	#include <algorithm>
	#include <cstdlib>
	// -*- compile-command: "nvcc -m 64 -arch compute_30 -Xptxas=-v -o probe_bw probe_bw.cu"; -*-

	//
	// Copyright 2015 Allan MacKinnon <allanmac@alum.mit.edu>
	//
	// Permission is hereby granted, free of charge, to any person obtaining
	// a copy of this software and associated documentation files (the
	// "Software"), to deal in the Software without restriction, including
	// without limitation the rights to use, copy, modify, merge, publish,
	// distribute, sublicense, and/or sell copies of the Software, and to