【CUDA】CUDA将RGB图像转成灰度图并统计并行直方图

最新推荐文章于 2025-04-25 21:14:21 发布

小飞哥咯咯咯

最新推荐文章于 2025-04-25 21:14:21 发布

阅读量250

点赞数 3

分类专栏： CUDA 文章标签： CUDA C++ opencv 学习

本文链接：https://blog.csdn.net/weixin_45207619/article/details/140228100

版权

CUDA 专栏收录该内容

5 篇文章

订阅专栏

笔者在阅读网上的文章时，看到这篇。
遂安装了opencv库准备一试，结果不管怎么弄都报错找不到文件，最后发现，竟然是作者将头文件中的/写成了\。
试了之后发现这篇文章中的代码没有任何输出，连最基本的灰度图都输不出来，遂参考GPT写了一个输出脚本，这么看opencv封装的函数还是很好用的，比如这里面的cv:imgwrite函数。
贴一下可以用的基础版本代码吧~

#include "cuda_runtime.h"
#include "device_launch_parameters.h"
#include <cuda.h>
#include <device_functions.h>
#include <opencv2/opencv.hpp>
#include <iostream>
#include <math.h>
using namespace std;
using namespace cv;

//输入图像为BGR图，将其转化为gray图
__global__ void rgb2grayInCuda(uchar3 *dataIn, unsigned char *dataOut, int imgHeight, int imgWidth)
{
	int xIndex = threadIdx.x + blockIdx.x * blockDim.x;
	int yIndex = threadIdx.y + blockIdx.y * blockDim.y;

	if (xIndex < imgWidth && yIndex < imgHeight)
	{
		uchar3 rgb = dataIn[yIndex * imgWidth + xIndex];

		dataOut[yIndex * imgWidth + xIndex] = 0.299f * rgb.x + 0.587f * rgb.y + 0.114f * rgb.z;
	}
}

//灰度直方图统计
__global__ void imHistInCuda(unsigned char *dataIn, int *hist)
{
	int threadIndex = threadIdx.x + threadIdx.y * blockDim.x;
	int blockIndex = blockIdx.x + blockIdx.y * gridDim.x;
	int index = threadIndex + blockIndex * blockDim.x * blockDim.y;

	atomicAdd(&hist[dataIn[index]], 1);

}

int main()
{
	//传入图片
	Mat srcImg = imread("input.jpg");

	int imgHeight = srcImg.rows;
	int imgWidth = srcImg.cols;
	Mat grayImg(imgHeight, imgWidth, CV_8UC1, Scalar(0));//输出灰度图
	int hist[256];//灰度直方图统计数组
	memset(hist, 0, 256 * sizeof(int));

	//在GPU中开辟输入输出空间
	uchar3 *d_in;
	unsigned char *d_out;
	int *d_hist;

	cudaMalloc((void**)&d_in, imgHeight * imgWidth * sizeof(uchar3));
	cudaMalloc((void**)&d_out, imgHeight * imgWidth * sizeof(unsigned char));
	cudaMalloc((void**)&d_hist, 256 * sizeof(int));

	//将图像数据传入GPU中
	cudaMemcpy(d_in, srcImg.data, imgHeight * imgWidth * sizeof(uchar3), cudaMemcpyHostToDevice);
	cudaMemcpy(d_hist, hist, 256 * sizeof(int), cudaMemcpyHostToDevice);

	dim3 threadsPerBlock(32, 32);
	dim3 blocksPerGrid((imgWidth + threadsPerBlock.x - 1) / threadsPerBlock.x, (imgHeight + threadsPerBlock.y - 1) / threadsPerBlock.y);

	//灰度化
	rgb2grayInCuda << <blocksPerGrid, threadsPerBlock >> >(d_in, d_out, imgHeight, imgWidth);

	//灰度直方图统计
	imHistInCuda << <blocksPerGrid, threadsPerBlock >> >(d_out, d_hist);

	//将数据从GPU传回CPU
	cudaMemcpy(hist, d_hist, 256 * sizeof(int), cudaMemcpyDeviceToHost);
	cudaMemcpy(grayImg.data, d_out, imgHeight * imgWidth * sizeof(unsigned char), cudaMemcpyDeviceToHost);

    imwrite("output.jpg", grayImg);

	cudaFree(d_in);
	cudaFree(d_out);
	cudaFree(d_hist);

	return 0;
}