public class Distinct { static { System.setProperty("hadoop.home.dir", "D:\\hadoop\\hadoop-2.8.3"); } public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException { //初始化job Configuration conf = new Configuration(); Job job = Job.getInstance(conf, "distinct"); //输入文件 FileInputFormat.addInputPath(job,new Path(args[0])); //mapper计算 job.setMapperClass(MyMapper.class); //shuffle //reduce计算 job.setReducerClass(MyReducer.class); job.setOutputKeyClass(Text.class); job.setOutputValueClass(Text.class); //输出 FileOutputFormat.setOutputPath(job,new Path(args[1])); //提交 boolean result = job.waitForCompletion(true); System.out.println(result?1:0); } public static class MyMapper extends Mapper<LongWritable,Text,Text,Text>{ @Override protected void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException { context.write(value,new Text("")); } } public static class MyReducer extends Reducer<Text,Text,Text,Text>{ @Override protected void reduce(Text key, Iterable<Text> values, Context context) throws IOException, InterruptedException { context.write(key,new Text("")); } } }
MapReduce 去重
最新推荐文章于 2022-12-19 10:00:00 发布