1. 源数据(每行一条记录,格式为"姓名 成绩",以空格分隔):
张三 90
李四 100
张三 60
李四 80
王五 88
李四 100
2.代码如下:
package com.average;
import java.io.IOException;
import java.util.StringTokenizer;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.util.GenericOptionsParser;
public class Average {
public static class Map extends Mapper<Object, Text, Text, IntWritable>{
public void map(Object key,Text value,Context context) throws IOException, InterruptedException{
String line=value.toString();
String[] line1=line.split(" ");
String person=line1[0].toString();
IntWritable i=new IntWritable(Integer.parseInt(line1[1]));
//System.out.print(person+" "+i);
context.write(new Text(person), i);
}
}
public static class Redudce extends Reducer<Text, IntWritable, Text, IntWritable>{
private static IntWritable i=new IntWritable(1);
public void reduce(Text key,Iterable<IntWritable> value,Context context) throws IOException, InterruptedException{
int sum=0; //总分
int ave=0;
int count=0; //个数
for(IntWritable v:value){
sum+=v.get();
count++;
//System.out.println(v);
}
ave=sum/count;
IntWritable ave1=new IntWritable(ave);
context.write(key, ave1);
System.out.println(key+" "+ave1);
}
}
public static void main(String args[]) throws IOException, ClassNotFoundException, InterruptedException{
Configuration conf=new Configuration();
String otherargs[]=new GenericOptionsParser(conf, args).getRemainingArgs();
if(otherargs.length!=2){
System.exit(2);
}
Job job=new Job(conf,"average");
job.setJarByClass(Average.class);
job.setMapperClass(Map.class);
job.setCombinerClass(Redudce.class);
job.setReducerClass(Redudce.class);
job.setOutputKeyClass(Text.class);
job.setOutputValueClass(IntWritable.class);
FileInputFormat.addInputPath(job, new Path(otherargs[0]));
FileOutputFormat.setOutputPath(job, new Path(otherargs[1]));
System.exit(job.waitForCompletion(true) ? 0 : 1);
}
}
程序运行后,输出文件夹里是空的,很是苦恼……