OpenCL程序完整例子

最新推荐文章于 2025-10-17 23:39:22 发布

原创最新推荐文章于 2025-10-17 23:39:22 发布 · 1.1k 阅读

5 ·

CC 4.0 BY-SA版权

OpenCl/CUDA算法加速专栏收录该内容

10 篇文章

订阅专栏

#include<iostream>

#include "common.h"


#define DATA_SIZE 8388608

using namespace std;


int valuesOK(UserData* to, UserData* from) 
{
	for (int i = 0; i < DATA_SIZE; ++i) {
		if (to[i].w != from[i].w) return 0;
	}
	return 1;
}







int buffer_query(int argc, char* argv[])
{
	/* OpenCL 1.1 data structures */
	cl_platform_id* platforms;
	cl_program program;
	cl_device_id device;
	cl_context context;

	/* OpenCL 1.1 scalar data types */
	cl_uint numOfPlatforms;
	cl_int  error;

	/*
	Prepare an array of UserData via dynamic memory allocation
	*/
	UserData* ud_in = (UserData*)malloc(sizeof(UserData) * DATA_SIZE); // input to device
	UserData* ud_out = (UserData*)malloc(sizeof(UserData) * DATA_SIZE); // output from device
	for (int i = 0; i < DATA_SIZE; ++i) {
		(ud_in + i)->x = i;
		(ud_in + i)->y = i;
		(ud_in + i)->z = i;
		(ud_in + i)->w = 3 * i;
	}
	/*
	Get the number of platforms
	Remember that for each vendor's SDK installed on the computer,
	the number of available platform also increased.
	*/
	error = clGetPlatformIDs(0, NULL, &numOfPlatforms);
	if (error != CL_SUCCESS) {
		perror("Unable to find any OpenCL platforms");
		exit(1);
	}

	platforms = (cl_platform_id*)alloca(sizeof(cl_platform_id) * numOfPlatforms);
	printf("Number of OpenCL platforms found: %d\n", numOfPlatforms);

	error = clGetPlatformIDs(numOfPlatforms, platforms, NULL);
	if (error != CL_SUCCESS) {
		perror("Unable to find any OpenCL platforms");
		exit(1);
	}
	// Search for a CPU/GPU device through the installed platforms
	// Build a OpenCL program and do not run it.
	for (cl_uint i = 0; i < numOfPlatforms; i++) {
		// Get the GPU device
		error = clGetDeviceIDs(platforms[i], CL_DEVICE_TYPE_GPU, 1, &device, NULL);
		if (error != CL_SUCCESS) {
			// Otherwise, get the CPU
			error = clGetDeviceIDs(platforms[i], CL_DEVICE_TYPE_CPU, 1, &device, NULL);
		}
		if (error != CL_SUCCESS) {
			perror("Can't locate any OpenCL compliant device");
			exit(1);
		}
		/* Create a context */
		context = clCreateContext(NULL, 1, &device, NULL, NULL, &error);
		if (error != CL_SUCCESS) {
			perror("Can't create a valid OpenCL context");
			exit(1);
		}

		/* Load the two source files into temporary datastores */
		const char *file_names[] = { "user_test.cl" };
		const int NUMBER_OF_FILES = 1;
		char* buffer[NUMBER_OF_FILES];
		size_t sizes[NUMBER_OF_FILES];
		loadProgramSource(file_names, NUMBER_OF_FILES, buffer, sizes);

		/* Create the OpenCL program object */
		program = clCreateProgramWithSource(context, NUMBER_OF_FILES, (const char**)buffer, sizes, &error);
		if (error != CL_SUCCESS) {
			perror("Can't create the OpenCL program object");
			exit(1);
		}
		/* Build OpenCL program object and dump the error message, if any */
		char *program_log;
		size_t log_size;
		error = clBuildProgram(program, 1, &device, NULL, NULL, NULL);
		if (error != CL_SUCCESS) {
			// If there's an error whilst building the program, dump the log
			clGetProgramBuildInfo(program, device, CL_PROGRAM_BUILD_LOG, 0, NULL, &log_size);
			program_log = (char*)malloc(log_size + 1);
			program_log[log_size] = '\0';
			clGetProgramBuildInfo(program, device, CL_PROGRAM_BUILD_LOG,
				log_size + 1, program_log, NULL);
			printf("\n=== ERROR ===\n\n%s\n=============\n", program_log);
			free(program_log);
			exit(1);
		}

		/* Query the program as to how many kernels were detected */
		cl_uint numOfKernels;
		error = clCreateKernelsInProgram(program, 0, NULL, &numOfKernels);
		if (error != CL_SUCCESS) {
			perror("Unable to retrieve kernel count from program");
			exit(1);
		}
		cl_kernel* kernels = (cl_kernel*)alloca(sizeof(cl_kernel) * numOfKernels);
		error = clCreateKernelsInProgram(program, numOfKernels, kernels, NULL);
		

		for (cl_uint i = 0; i < numOfKernels; i++) 
		{
			char kernelName[32];
			cl_uint argCnt;
			clGetKernelInfo(kernels[i], CL_KERNEL_FUNCTION_NAME, sizeof(kernelName), kernelName, NULL);
			clGetKernelInfo(kernels[i], CL_KERNEL_NUM_ARGS, sizeof(argCnt), &argCnt, NULL);
			printf("Kernel name: %s with arity: %d\n", kernelName, argCnt);
			printf("About to create command queue and enqueue this kernel...\n");

			/* Create a command queue */ ///创建命令队列
			cl_command_queue cQ = clCreateCommandQueue(context, device, 0, &error);
			if (error != CL_SUCCESS) {
				perror("Unable to create command-queue");
				exit(1);
			}

			/* Create a OpenCL buffer object */ ///创建缓存对象
			cl_mem UDObj = clCreateBuffer(context, CL_MEM_READ_WRITE | CL_MEM_COPY_HOST_PTR,sizeof(UserData) * DATA_SIZE, ud_in, &error);

			if (error != CL_SUCCESS) {
				perror("Unable to create buffer object");
				exit(1);
			}

			/* Extract some info about the buffer object we created */
			displayBufferDetails(UDObj);

			/* Let OpenCL know that the kernel is suppose to receive an argument */
			// 让OpenCL知道内核应该接收一个参数
			error = clSetKernelArg(kernels[i], 0, sizeof(cl_mem), &UDObj);
			if (error != CL_SUCCESS) {
				perror("Unable to create buffer object");
				exit(1);
			}

			/* Enqueue the kernel to the command queue */
			// 将内核放入命令队列
			error = clEnqueueTask(cQ, kernels[i], 0, NULL, NULL);
			if (error != CL_SUCCESS) {
				perror("Unable to enqueue task to command-queue");
				exit(1);
			}
			printf("Task has been enqueued successfully!\n");

			/* Enqueue the read-back from device to host */
			error = clEnqueueReadBuffer(cQ, UDObj,
				CL_TRUE,                    // blocking read
				0,                          // write from the start
				sizeof(UserData) * DATA_SIZE, // how much to copy
				ud_out, 0, NULL, NULL);

			if (valuesOK(ud_in, ud_out)) {
				printf("Check passed!\n");
			}
			else printf("Check failed!\n");

			/* Release the command queue */
			clReleaseCommandQueue(cQ);
			clReleaseMemObject(UDObj);
		}

		/* Clean up */

		for (cl_uint i = 0; i < numOfKernels; i++) { clReleaseKernel(kernels[i]); }
		for (i = 0; i< NUMBER_OF_FILES; i++) { free(buffer[i]); }
		clReleaseProgram(program);
		clReleaseContext(context);
	}

	free(ud_in);
	free(ud_out);
}


int main(int argc,char* argv[])
{
 

 //PlatForminfo(argc,argv);
//	BuildProgram(argc, argv);

 cout<<"My Love Ye!"<<endl;
 system("pause");
 return 0;
}

头文件common.h里代码：

#ifndef COMMON_H_
#define COMMON_H_

#include <stdio.h>
#include <stdlib.h>
#include <sys/types.h>

#include <string>

//#include <alloca.h>



#ifdef APPLE
#include<OpenCL/cl.h>
#else
#include <CL/cl.h>
#endif // APPLE



// Simulating the OpenCL vector data type: int4
typedef struct UserData {
	int x;
	int y;
	int z;
	int w;
} UserData;




void displayPlatformInfo(cl_platform_id id,cl_platform_info param_name,const char* paramNameAsStr)
{
	cl_int error = 0;
	size_t paramSize = 0;
	error = clGetPlatformInfo(id, param_name, 0, NULL, &paramSize);
	
	char* moreInfo = (char*)alloca(sizeof(char)*paramSize);
	error = clGetPlatformInfo(id, param_name, paramSize, moreInfo, NULL);
	if (error!=CL_SUCCESS)
	{
		perror("Unable to find any OpenCl platform Information!");
		return;
	}
	printf("%s:%s\n", paramNameAsStr, moreInfo);
}


/************************************************************************/
/* file  file name
*  length  file number
*  buffer  save file program
*  sizes   file length
*/
/************************************************************************/

void loadProgramSource(const char** files,size_t length,char **buffer,size_t*sizes)
{
	for (size_t i=0;i<length;++i)
	{
		FILE *file = fopen(files[i], "r");
		if (file==NULL)
		{
			perror("Couldn't read the program files");
			exit(1);
		}
		fseek(file,0,SEEK_END);
		sizes[i] = ftell(file);//得到文件的长度
		rewind(file);//重置文件指针到文件头，进行文件的读取
		buffer[i] = (char*)malloc(sizes[i] + 1);
		buffer[i][sizes[i]] = '\0';
		fread(buffer[i],sizeof(char),sizes[i],file);
		fclose(file);
	}

	return;
}


void displayBufferDetails(cl_mem memobj) {
	cl_mem_object_type objT;
	cl_mem_flags flags;
	size_t memSize;

	clGetMemObjectInfo(memobj, CL_MEM_TYPE, sizeof(cl_mem_object_type), &objT, 0);
	clGetMemObjectInfo(memobj, CL_MEM_FLAGS, sizeof(cl_mem_flags), &flags, 0);
	clGetMemObjectInfo(memobj, CL_MEM_SIZE, sizeof(size_t), &memSize, 0);

	char* str = '\0';
	switch (objT) {
	case CL_MEM_OBJECT_BUFFER: str = "Buffer or Sub-buffer"; break;
	case CL_MEM_OBJECT_IMAGE2D: str = "2D Image Object"; break;
	case CL_MEM_OBJECT_IMAGE3D: str = "3D Image Object"; break;
	}

	char flagStr[128] = { '\0' };
	if (flags & CL_MEM_READ_WRITE)     strcat(flagStr, "Read-Write|");
	if (flags & CL_MEM_WRITE_ONLY)     strcat(flagStr, "Write Only|");
	if (flags & CL_MEM_READ_ONLY)      strcat(flagStr, "Read Only|");
	if (flags & CL_MEM_COPY_HOST_PTR)  strcat(flagStr, "Copy from Host|");
	if (flags & CL_MEM_USE_HOST_PTR)   strcat(flagStr, "Use from Host|");
	if (flags & CL_MEM_ALLOC_HOST_PTR) strcat(flagStr, "Alloc from Host|");

	printf("\tOpenCL Buffer's details =>\n\t size: %lu MB,\n\t object type is: %s,\n\t flags:0x%lx (%s) \n", memSize >> 20, str, flags, flagStr);
}














#endif

user_test.cl里的代码：

typedef struct UserData {
    int x;
    int y;
    int z;
    int w;
} UserData;


__kernel void hello(__global UserData* data) {
    int id = get_global_id(0);
    data[id].w = data[id].x + data[id].y + data[id].z;        
}