CUDA thrust库sort_by_key函数

问题描述

#include <stdio.h>
#include <thrust/host_vector.h>
#include <thrust/device_vector.h>
#include <thrust/sort.h>
#define SIZE 6

__global__ void kernel1(int* key, int* value)
{
    for(int i = 0; i < SIZE; i++)
    {
        printf("key[%d] = %d value[%d] = %d\n", i, key[i], i, value[i]);
    }
    printf("\n");
}

int main(){
    int key[SIZE] = {24, 43, 27, 42, 25, 40};
    int value[SIZE] = {0, 1, 2, 3, 4, 5};
    int *d_key, *d_value;
    cudaMalloc((void**)&d_key, sizeof(int) * SIZE);
    cudaMalloc((void**)&d_value, sizeof(int) * SIZE);
    cudaMemcpy(d_key, key, sizeof(int) * SIZE, cudaMemcpyHostToDevice);
    cudaMemcpy(d_value, value, sizeof(int) * SIZE, cudaMemcpyHostToDevice);

    kernel1<<<1,1>>>(d_key, d_value);
    cudaDeviceSynchronize();

    //- sort
    thrust::device_ptr<int> t_key(d_key);
    thrust::device_ptr<int> t_value(d_value);
    thrust::sort_by_key(t_value, t_value + SIZE, t_key);
    cudaDeviceSynchronize();

    kernel1<<<1,1>>>(d_key, d_value);
    cudaDeviceSynchronize();
    return 0;
}

sort前后的输出结果分别为:

#- 预期结果                  运行结果
key[0] = 24 value[0] = 0    key[0] = 24 value[0] = 0
key[1] = 43 value[1] = 1    key[1] = 43 value[1] = 1
key[2] = 27 value[2] = 2    key[2] = 27 value[2] = 2
key[3] = 42 value[3] = 3    key[3] = 42 value[3] = 3
key[4] = 25 value[4] = 4    key[4] = 25 value[4] = 4
key[5] = 40 value[5] = 5    key[5] = 40 value[5] = 5

key[0] = 24 value[0] = 0    key[0] = 24 value[0] = 0
key[1] = 25 value[1] = 4    key[1] = 43 value[1] = 1
key[2] = 27 value[2] = 2    key[2] = 27 value[2] = 2
key[3] = 40 value[3] = 5    key[3] = 42 value[3] = 3
key[4] = 42 value[4] = 3    key[4] = 25 value[4] = 4
key[5] = 43 value[5] = 1    key[5] = 40 value[5] = 5
评论 4
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值