视频
CUDA真香?CUDA与CPU在计算性能方面的差距
测试平台
Jetson Orin Nano
测试代码
代码仓库(如果对你有用,麻烦点个 Star!)
https://github.com/LitchiCheng/CUDA_Test
如下为部分测试代码:
#include <cstdio>
#include "cuda_runtime.h"
#include <sys/time.h>
#include <time.h>
#include <math.h>
#include "utility/timecost.h"
__global__ void kernelAdd(float * A, float * B, float * C)
{
int ix=threadIdx.x+blockDim.x*blockIdx.x;
int iy=threadIdx.y+blockDim.y*blockIdx.y;
int idx=ix+iy*blockDim.x*gridDim.x;
C[idx]=cos(A[idx])+sin(B[idx]);
// if(idx == 2077){
// printf("idx[%d],ix[%d],iy[%d],bdx[%d],bdy[%d],bix[%d],biy