(De)coding

Pantelis Sopasakis alphaville

(De)coding

Lecturer at QUB, EEECS, i-AMS.

alphaville / cuda_timer.cuh

Last active August 29, 2015 14:07

alphaville / test_matvec_inexact_tiling.cu

Last active August 29, 2015 14:07

alphaville / matvec_inexact_tiling_kernel.cu

Last active August 29, 2015 14:07

alphaville / rand_data.h

Last active August 29, 2015 14:07

	/* Auto-generated file (by a MATLAB script) - ID 3062321795 */

	#ifndef __RAND_DATA_TURBO__
	#define __RAND_DATA_TURBO__

	#define NS 32

	__device__ float dev_x[32] =
	{ 9.320295340189, 8.666071467758, 2.064062819139, 5.206786781683, 9.887525026886, 9.196139126590, 2.988093813008, 9.115010659100, 4.994307851747, 0.409423900211,
	1.911173066863, 1.515824153316, 5.797111859887, 1.448878331722, 8.210170746106, 6.347733121928, 7.880805428768, 0.672098319650, 5.452277295227, 9.969671220601,

alphaville / use_matvec_kernel.cu

Last active August 29, 2015 14:07

	int main(void) {

	checkCudaErrors(cudaSetDeviceFlags(cudaDeviceMapHost));

	float * dev_ptr_A = NULL;
	float * dev_ptr_x = NULL;
	float * hst_y = NULL;
	float * address_y = NULL;

	checkCudaErrors(

alphaville / dev_static_cublas.cu

Last active August 29, 2015 14:07

alphaville / cublas_dot_prod.cu

Created October 13, 2014 18:57

alphaville / support_mapping.cu

Created October 13, 2014 18:02

	/* Device properties; filled in by cudaGetDeviceProperties below. */
	cudaDeviceProp prop;
	/* Device ordinal; written by cudaGetDevice below. */
	int whichDevice;

	/* Query which device is current, then fetch that device's properties.
	   Both return codes are handed to checkCudaErrors. */
	checkCudaErrors( cudaGetDevice(&whichDevice));
	checkCudaErrors( cudaGetDeviceProperties(&prop, whichDevice));

	/* Give up (print to stderr and return 1) unless the device reports
	   canMapHostMemory == 1. */
	if (prop.canMapHostMemory != 1){
	fprintf(stderr, "Device cannot map memory!\n");
	return 1;
	}

alphaville / zero_copy.cu

Created October 13, 2014 18:01

	int main(void) {

	int * host_p; /**< Host data allocated as pinned memory */
	int * dev_ptr_p; /**< this pointer resides on the host */
	int ns = 32;
	int data_size = ns * sizeof(int);

	checkCudaErrors(
	cudaHostAlloc((void**) &host_p, data_size, cudaHostAllocMapped));

alphaville / cudaHostAlloc_example.cu

Created October 13, 2014 18:00

	#include <stdio.h>
	#include <cuda_runtime.h>
	#include "helper_cuda.h"

	/*
	 * Adds 10, in place, to one element of d_var per thread: each thread
	 * updates the element whose index equals its own threadIdx.x.
	 * Only threadIdx.x is used for indexing and no bounds check is made.
	 */
	__global__ void kernel(int *d_var) {
		const unsigned int tid = threadIdx.x;
		d_var[tid] = d_var[tid] + 10;
	}

	/* NOTE(review): the code that allocates and uses these file-scope pointers
	   is outside this view; the host/device roles suggested by the names are
	   an assumption — confirm against the rest of the file. */
	int * host_p;
	int * host_result;
	int * dev_p;