Tadej Ciglarič t4c1

## eigendecomposition_speed_precision.cpp
#include <stan/math.hpp>
#include <stan/math/prim/mat/fun/symmetric_eigensolver.hpp>
#include <chrono>
#include <cstdio>

using namespace std;
using namespace Eigen;
using namespace stan::math;

double residual(const MatrixXd& a, const VectorXd& eigenvals, const MatrixXd& eigenvecs) {

## bernouli_logit_minitest.cpp
//
// Created by tadej on 27. 07. 2018.
//
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0
#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
#define USE_TIMING_OUTPUTS

//#include <CL/cl.hpp>
#include <Eigen/Dense>

## mvmTest.cpp
#include <iostream>

#define STAN_OPENCL
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0

#ifdef STAN_OPENCL

#include <stan/math.hpp>
#include <stan/math/opencl/add.hpp>

## cov_benchmark.cpp
#include <iostream>

//#define STAN_OPENCL
//#define OPENCL_PLATFORM_ID 0
//#define OPENCL_DEVICE_ID 0

#include <stan/math.hpp>
#include <stan/math/opencl/copy.hpp>
#include <stan/math/opencl/matrix_cl.hpp>
#include <stan/math/rev/mat/fun/gp_exp_quad_cov.hpp>

## cov_threshold.cpp
#include <iostream>

#define STAN_OPENCL
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0

#include <stan/math.hpp>
#include <stan/math/opencl/copy.hpp>
#include <stan/math/opencl/matrix_cl.hpp>
#include <stan/math/rev/mat/fun/gp_exp_quad_cov.hpp>

## softmax_benchmark.cpp
#define STAN_OPENCL
#define STAN_OPENCL_CACHE
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0
#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
#define __CL_ENABLE_EXCEPTIONS

#include <stan/math/prim/scal/meta/partials_return_type.hpp>
#include <stan/math.hpp>
#include <Eigen/Dense>

## ordered_logistic_benchmark.cpp
#define STAN_OPENCL
#define STAN_OPENCL_CACHE
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0
#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
#define __CL_ENABLE_EXCEPTIONS

#include <stan/math/prim/scal/meta/partials_return_type.hpp>
#include <stan/math.hpp>
#include <Eigen/Dense>

## cov_benchmark.cpp
#include <iostream>

#define STAN_OPENCL
#define OPENCL_PLATFORM_ID 0
#define OPENCL_DEVICE_ID 0

#include <stan/math.hpp>
#include <stan/math/opencl/copy.hpp>
#include <stan/math/opencl/matrix_cl.hpp>
#include <stan/math/rev/mat/fun/gp_exp_quad_cov.hpp>

## plot_thresholds.py
import pandas, numpy
import matplotlib.pyplot as plt

data = pandas.read_csv("thresholds.txt")
models=numpy.array(data["model"])
speedup=numpy.array(data["speedup"])
attributes=numpy.array(data["attributes"])
cases=numpy.array(data["cases"])

selection = numpy.logical_and(models!="normal_id",numpy.logical_or(cases>20000,numpy.logical_and(cases>8000, models=="negbin_log_2")))

## clinfo1.txt
Number of platforms                               2
  Platform Name                                   NVIDIA CUDA
  Platform Vendor                                 NVIDIA Corporation
  Platform Version                                OpenCL 1.2 CUDA 10.1.120
  Platform Profile                                FULL_PROFILE
  Platform Extensions                             cl_khr_global_int32_base_atomics cl_khr_global_int32_extended_atomics cl_khr_local_int32_base_atomics cl_khr_local_int32_extended_atomics cl_khr_fp64 cl_khr_byte_addressable_store cl_khr_icd cl_khr_gl_sharing cl_nv_compiler_options cl_nv_device_attribute_query cl_nv_pragma_unroll cl_nv_d3d10_sharing cl_khr_d3d10_sharing cl_nv_d3d11_sharing cl_nv_copy_opts cl_nv_create_buffer
  Platform Extensions function suffix             NV

  Platform Name                                   Experimental OpenCL 2.1 CPU Only Platform
  Platform Vendor                                 Intel(R) Corporation
	#include <stan/math.hpp>
	#include <stan/math/prim/mat/fun/symmetric_eigensolver.hpp>
	#include <chrono>
	#include <cstdio>

	using namespace std;
	using namespace Eigen;
	using namespace stan::math;

	double residual(const MatrixXd& a, const VectorXd& eigenvals, const MatrixXd& eigenvecs) {
	//
	// Created by tadej on 27. 07. 2018.
	//
	#define OPENCL_PLATFORM_ID 0
	#define OPENCL_DEVICE_ID 0
	#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
	#define USE_TIMING_OUTPUTS

	//#include <CL/cl.hpp>
	#include <Eigen/Dense>
	#include <iostream>

	#define STAN_OPENCL
	#define OPENCL_PLATFORM_ID 0
	#define OPENCL_DEVICE_ID 0

	#ifdef STAN_OPENCL

	#include <stan/math.hpp>
	#include <stan/math/opencl/add.hpp>
	#include <iostream>

	//#define STAN_OPENCL
	//#define OPENCL_PLATFORM_ID 0
	//#define OPENCL_DEVICE_ID 0

	#include <stan/math.hpp>
	#include <stan/math/opencl/copy.hpp>
	#include <stan/math/opencl/matrix_cl.hpp>
	#include <stan/math/rev/mat/fun/gp_exp_quad_cov.hpp>
	#define STAN_OPENCL
	#define STAN_OPENCL_CACHE
	#define OPENCL_PLATFORM_ID 0
	#define OPENCL_DEVICE_ID 0
	#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
	#define __CL_ENABLE_EXCEPTIONS

	#include <stan/math/prim/scal/meta/partials_return_type.hpp>
	#include <stan/math.hpp>
	#include <Eigen/Dense>
	import pandas, numpy
	import matplotlib.pyplot as plt

	data = pandas.read_csv("thresholds.txt")
	models=numpy.array(data["model"])
	speedup=numpy.array(data["speedup"])
	attributes=numpy.array(data["attributes"])
	cases=numpy.array(data["cases"])

	selection = numpy.logical_and(models!="normal_id",numpy.logical_or(cases>20000,numpy.logical_and(cases>8000, models=="negbin_log_2")))
	Number of platforms 2
	Platform Name NVIDIA CUDA
	Platform Vendor NVIDIA Corporation
	Platform Version OpenCL 1.2 CUDA 10.1.120
	Platform Profile FULL_PROFILE
	Platform Extensions cl_khr_global_int32_base_atomics cl_khr_global_int32_extended_atomics cl_khr_local_int32_base_atomics cl_khr_local_int32_extended_atomics cl_khr_fp64 cl_khr_byte_addressable_store cl_khr_icd cl_khr_gl_sharing cl_nv_compiler_options cl_nv_device_attribute_query cl_nv_pragma_unroll cl_nv_d3d10_sharing cl_khr_d3d10_sharing cl_nv_d3d11_sharing cl_nv_copy_opts cl_nv_create_buffer
	Platform Extensions function suffix NV

	Platform Name Experimental OpenCL 2.1 CPU Only Platform
	Platform Vendor Intel(R) Corporation