输入数据
test1
test2 test2
test3 test3 test3
test4 test4 test4 test4
test5 test5 test5 test5 test5
自定义Driver类(WordCountDriver)
将《MapReduce中词频统计简单实现》一文中的 WordCountDriver 类改为如下代码，其余代码保持不变。
package com.test.mapreduce.combiner;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import java.io.IOException;
public class WordCountDriver {
public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
// 1.创建配置信息Configuration对象并获取Job单例对象
Configuration