Lesson2 Square number

最新推荐文章于 2018-05-02 13:52:51 发布

seamanj

最新推荐文章于 2018-05-02 13:52:51 发布

阅读量529

点赞数

分类专栏： CUDA

本文链接：https://blog.csdn.net/seamanj/article/details/49657339

版权

CUDA 专栏收录该内容

23 篇文章 0 订阅

订阅专栏

//filename: square.cu
// By Seamanj 04/11/2015 @NCCA
 
#include <stdio.h>


// Element-wise square: d_out[i] = d_in[i] * d_in[i].
//
// Launch layout: 1D grid of 1D blocks, one thread per element. The element
// index is the flat global thread index, so both single-block launches
// (<<<1, N>>>) and multi-block launches (<<<N / B, B>>>) are handled.
//
// Preconditions: d_in and d_out must each be valid for at least
// gridDim.x * blockDim.x floats -- there is no bounds check because the
// kernel does not receive an element count.
__global__
void square(float * d_out, float * d_in)
{
	// blockIdx.x is 0 for a single-block launch, so this reduces to
	// threadIdx.x in that case.
	const int idx = blockIdx.x * blockDim.x + threadIdx.x;
	const float f = d_in[idx];
	d_out[idx] = f * f;
}

// Reports a failed CUDA runtime call on stderr.
// Returns true when `status` is cudaSuccess, false otherwise.
static bool cudaSucceeded(cudaError_t status, const char * what)
{
	if (status == cudaSuccess)
	{
		return true;
	}
	fprintf(stderr, "CUDA error during %s: %s\n", what, cudaGetErrorString(status));
	return false;
}

// Squares the numbers 0..63 on the GPU and prints the results, four per line.
// Returns 0 on success and 1 if any CUDA call or the kernel launch fails.
int main(int argc, char ** argv)
{
	const int ARRAY_SIZE = 64;
	const int ARRAY_BYTES = ARRAY_SIZE * sizeof(float);
	
	// generate the input array on the host
	float h_in[ARRAY_SIZE];
	for (int i = 0; i < ARRAY_SIZE; ++i)
	{
		h_in[i] = float(i);
	}
	
	float h_out[ARRAY_SIZE];
	
	// declare GPU memory pointers; NULL-initialised so the cleanup below is
	// safe even when an allocation fails (cudaFree on a null pointer is a no-op)
	float * d_in = NULL;
	float * d_out = NULL;
	
	// allocate device buffers and transfer the input array to the GPU;
	// && short-circuits, so later steps are skipped after the first failure
	bool ok = cudaSucceeded(cudaMalloc((void**) &d_in, ARRAY_BYTES), "cudaMalloc(d_in)")
		&& cudaSucceeded(cudaMalloc((void**) &d_out, ARRAY_BYTES), "cudaMalloc(d_out)")
		&& cudaSucceeded(cudaMemcpy(d_in, h_in, ARRAY_BYTES, cudaMemcpyHostToDevice),
		                 "cudaMemcpy(host to device)");
	
	if (ok)
	{
		// launch the kernel: one block, one thread per element
		square<<<1, ARRAY_SIZE>>>(d_out, d_in);
		
		// a kernel launch returns nothing, so launch-configuration errors
		// have to be fetched explicitly; the blocking cudaMemcpy that follows
		// reports any error raised while the kernel was executing
		ok = cudaSucceeded(cudaGetLastError(), "square kernel launch")
			// copy back the result array to the CPU
			&& cudaSucceeded(cudaMemcpy(h_out, d_out, ARRAY_BYTES, cudaMemcpyDeviceToHost),
			                 "cudaMemcpy(device to host)");
	}
	
	if (ok)
	{
		// print out the resulting array, four values per line
		for (int i = 0; i < ARRAY_SIZE; ++i)
		{
			printf("%f", h_out[i]);
			printf(((i % 4) != 3) ? "\t" : "\n");
		}
	}
	
	// release device memory on every path, success or failure
	cudaFree(d_in);
	cudaFree(d_out);
	
	return ok ? 0 : 1;
}

seamanj

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
Lesson2 Square number

//filename: square.cu // By Seamanj 04/11/2015 @NCCA #include <stdio.h> __global__ void square(float * d_out, float * d_in) { int idx = threadIdx.x; float f = d_in[idx]; d_out[idx] = f * f; } int main(
复制链接

扫一扫

专栏目录