Answer to the assessment for "Fundamentals of Accelerated Computing with OpenACC"

void pair_gpu(const double *d_x, const double *d_y, const double *d_z,
			  unsigned long long int *d_g2, int numatm, int nconf,
			  const double xbox, const double ybox, const double zbox, int d_bin)
{
	double r, cut, dx, dy, dz;
	int ig2;
	double box;
	box = min(xbox, ybox);
	box = min(box, zbox);

	double del = box / (2.0 * d_bin);
	cut = box * 0.5;
#pragma acc data copyin(d_x[:numatm*nconf], d_y[:numatm*nconf], d_z[:numatm*nconf]) copyout(d_g2[:d_bin]) 
{
    #pragma acc parallel num_gangs( 100 ) num_workers( 32 ) vector_length( 32 )
    #pragma acc loop gang private(dx,dy,dz,r,ig2) 
    for (int frame = 0; frame < nconf; frame++)
	{
        #pragma acc loop worker independent
		for (int id1 = 0; id1 < numatm; id1++)
		{
            #pragma acc loop vector independent
			for (int id2 = 0; id2 < numatm; id2++)
			{
				dx = d_x[frame * numatm + id1] - d_x[frame * numatm + id2];
				dy = d_y[frame * numatm + id1] - d_y[frame * numatm + id2];
				dz = d_z[frame * numatm + id1] - d_z[frame * numatm + id2];

				dx = dx - xbox * (round(dx / xbox));
				dy = dy - ybox * (round(dy / ybox));
				dz = dz - zbox * (round(dz / zbox));

				r = sqrtf(dx * dx + dy * dy + dz * dz);
				if (r < cut)
				{
					ig2 = (int)(r / del);
    #pragma acc atomic
                        d_g2[ig2] = d_g2[ig2] + 1;
                    }
                }
            }
        }
    }
}
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值