案例要求
统计输入路径下所有文件中每个不同单词的出现次数。
输入文件示例
// a.txt（节选：根据下方输出结果推算，以下两行在实际文件中共重复 6720 次，此处仅展示前 5 次）
hadoop mapreduce
hdfs
hadoop mapreduce
hdfs
hadoop mapreduce
hdfs
hadoop mapreduce
hdfs
hadoop mapreduce
hdfs
// inputword.txt
tony tony
study
hadoop
hdfs mapreduce
spark mysql
输出结果示例
// part-r-00000
hadoop 6721
hdfs 6721
mapreduce 6721
mysql 1
spark 1
study 1
tony 2
代码实现
WordCountMapper.java
package com.tony.mr.word_count;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Mapper;
import java.io.IOException;
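/**
* Mapper of the word-count job: consumes {@code Object}/{@code Text} input pairs and
* emits {@code Text}/{@code IntWritable} output pairs.
*
* @author tony
* @create 2020-07-19 18:41
*/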
public class WordCountMapper extends Mapper<Object, Text, Text, IntWritable> {
private Text word = new Text();
private IntWritable one = new IntWritable(1);
@Override
protected void map(Object key, Text value, Context context