mapreduce编程:多表关联

package my.hadoopstudy;  

import java.util.*;
import java.io.*;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.TextInputFormat;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
import org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat;


public class TableConnect {
 
 public static class tableMapper extends Mapper<Text, Text, Text, Text>
 {
  @Override
  public void map(Text key, Text value, Context context) throws IOException, InterruptedException
  {
       context.write(key,value);
  }
 }
 
 
 public static class tableReducer extends Reducer<Text, Text, Text, Text>
 {
  @Override
  public void reduce(Text key, Iterable<Text> values, Context context) throws IOException, InterruptedException
  {
   List<String> gChildren=new ArrayList<String>();
   List<String> gParents =new ArrayList<String>();
   for(Text val : values)
   {
    if(val.toString().charAt(0)  == '1')// the key's child.
    {
       gChildren.add(val.toString().substring(1));
    }
    else//the key's parent.
    {
       gParents.add(val.toString().substring(1));
    }
   }
   for(int i=0; i<gChildren.size(); i++)
    for(int j=0;j<gParents.size();j++)
    {
       context.write(new Text(gChildren.get(i)), new Text(gParents.get(j)));
    }
  } 
 }
 
 public static void main(String[] args) throws Exception
 {
  Configuration conf = new Configuration();
  conf.set("mapreduce.input.keyvaluelinerecordreader.key.value.separator", " ");
  
  Job job = new Job(conf, "tableConnect");
  job.setJarByClass(TableConnect.class);
  
  job.setMapperClass(tableMapper.class);
  job.setReducerClass(tableReducer.class);
  
  job.setOutputKeyClass(Text.class);
  job.setOutputValueClass(Text.class);
  
  job.setInputFormatClass(KeyValueTextInputFormat.class);
  job.setOutputFormatClass(TextOutputFormat.class);
  
  FileInputFormat.addInputPath(job, new Path(args[0]));
  FileOutputFormat.setOutputPath(job, new Path(args[1]));
  
  System.exit( job.waitForCompletion(true) ? 0 : 1);
 }
}

输入数据,文本1:

代号        公司

a 1Beijing Red Star
c 1Shenzhen Thunder
b 1Guangzhou Honda
a 1Beijing Rising
b 1Guangzhou Development Bank
c 1Tencent
a 1Back of Beijing



输入数据,文本2:

代号       地方

a 2Beijing
b 2Guangzhou
c 2Shenzhen
d 2Xian


输出:



  • 1
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值