本文主要整理了 MapReduce 常用的操作模板。
主函数(请忽略主类的名字,忘记改了):
package hadoop.wordCount;
import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.mapreduce.*;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.*;
public class WordCount {
public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
// TODO Auto-generated method stub
Configuration conf = new Configuration();
Path inpath = new Path(HDFS.HDFS_PATH+"/file/input");
Path outpath = new Path(HDFS.HDFS_PATH+"/file/output");
Job job = new Job(conf, "WordCount");
//先删除之前的输入输出文件,再重新读取输入文件
HDFS.rmInHDFS("/file/outpu