#include<iostream>
#include<cuda.h>
#include<cuda_runtime.h>
#include<time.h>
using namespace std;

// Compile-time configuration constants.

// Element-count bound: the judge kernel only reads da[i] for indices i < N.
const int N = 123456;

// Interval width used by the judge kernel: da[i] is tested against the
// half-open range [sample * j, sample * (j + 1)) for each j.
const int sample = 100;

// NOTE(review): `threads` and `blocks` are not referenced in the kernel code
// visible here; presumably they are the launch configuration (threads per
// block and blocks per grid) -- confirm at the kernel launch site.
const int threads = 256;
const int blocks = 2048;
__global__ void judge(int* da,int* data,int sam)
{
for(int i=blockIdx.x*blockDim.x+threadIdx.x;i<N+blockDim.x*gridDim.x;
i+=blockDim.x*gridDim.x)
{
if(i<N)
{
for(int j=0;j<sam;j++)
{
if((da[i]>=sample*j)&&(da[i]<sample*(j+1)))
#include<cuda.h>
#include<cuda_runtime.h>
#include<time.h>
using namespace std;
const int N=123456;
const int sample=100;
const int threads=256;
const int blocks=2048;
__global__ void judge(int* da,int* data,int sam)
{
for(int i=blockIdx.x*blockDim.x+threadIdx.x;i<N+blockDim.x*gridDim.x;
i+=blockDim.x*gridDim.x)
{
if(i<N)
{
for(int j=0;j<sam;j++)
{
if((da[i]>=sample*j)&&(da[i]<sample*(j+1)))