MapReduce实现矩阵相乘

矩阵相乘的定义可以参考百度百科的解释:http://baike.baidu.com/view/2455255.htm?fr=aladdin

有a和b两个矩阵

a:                1   2   3

                   4   5   0

                   7   8   9

                   10  11  12

b:              10  15

                  0     2

                  11   9

 c = a*b

1:将矩阵存到HDFS中:

                       矩阵a:


行   列   值   hdfs存储
1    1    1    1,1,1
1    2    2    1,2,2
1    3    3    1,3,3
2    1    4    2,1,4
2    2    5    2,2,5
2    3    0    不存储
3    1    7    3,1,7
3    2    8    3,2,8
3    3    9    3,3,9
4    1    10   4,1,10
4    2    11   4,2,11
4    3    12   4,3,12

                     

                        矩阵b:

行   列   值   hdfs存储
1    1    10   1,1,10
1    2    15   1,2,15
2    1    0    不存储
2    2    2    2,2,2
3    1    11   3,1,11
3    2    9    3,2,9


2:a的map读取

   读取到的第一个值是1,1,1,它是矩阵a第一行第一列的元素,在计算c(1,1)、c(1,2)时都要用到(这里c只有2列;如果c有n列,那么它要在计算c(1,1),c(1,2),c(1,3)...c(1,n)时使用)。因此我们输出两条数据:key = 1,1  value = a,1,1 和 key = 1,2  value = a,1,1。其中key (1,1)、(1,2)是c(1,1)、c(1,2)的坐标,value中的a表示该值来自矩阵a,后面依次是它在a中的列号和元素值。

  b的map读取

  读取到的第一个值是1,1,10,它是矩阵b第一行第一列的元素,在计算c(1,1)、c(2,1)、c(3,1)、c(4,1)时都要用到(这里c只有4行;如果c有m行,那么它要在计算c(1,1),c(2,1),c(3,1)...c(m,1)时使用)。因此我们输出四条数据:key = 1,1  value = b,1,10,key = 2,1  value = b,1,10,key = 3,1  value = b,1,10,key = 4,1  value = b,1,10。value中的b表示该值来自矩阵b,后面依次是它在b中的行号和元素值。

3:reduce读取计算

   通过mapA和mapB的输出,reduce在 key = 1,1 下可以得到 value = a,1,1、value = a,2,2、value = a,3,3、value = b,1,10、value = b,3,11(b(2,1)为0,没有存储,计算时按0处理)。把序号相同的a值和b值相乘后求和,就得到c(1,1) = 1*10 + 2*0 + 3*11 = 43。

代码如下:

package MyMatrix;

import java.io.IOException;
import java.util.Iterator;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.MultipleInputs;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;

public class MartrixMultiply{
	
	/**
	 * 最后得到的矩阵的列数
	 */
	public static final int COL_COUNT = 2;
	
	/**
	 * 最后得到的矩阵的行数
	 */
	public static final int ROW_COUNT = 4;
	
	/**
	 * A矩阵的列数或者是B矩阵的行数
	 */
	public static final int BROW_ACOL= 3;
	
	public static class MartrixMaperA extends Mapper<LongWritable, Text, Text, Text>{

		@Override
		protected void map(LongWritable key, Text value, Context context)
				throws IOException, InterruptedException {
			
			String valueStr = value.toString();
			String[] items = valueStr.split(",");
			
			int rowIndex = Integer.parseInt(items[0]);
			int colIndex = Integer.parseInt(items[1]);
			int valueInt = Integer.parseInt(items[2]);
			
			Text outKey = null;
			Text outValue = null;
			for(int i=0;i<COL_COUNT;i++){
				outKey = new Text(rowIndex + "," + (i+1));
				outValue = new Text("a,"+colIndex+","+valueInt);
				context.write(outKey, outValue);
			}
			
		}
		
	}
	
	public static class MartrixMaperB extends Mapper<LongWritable, Text, Text, Text>{

		@Override
		protected void map(LongWritable key, Text value, Context context)
				throws IOException, InterruptedException {
			
			String valueStr = value.toString();
			String[] items = valueStr.split(",");
			
			int rowIndex = Integer.parseInt(items[0]);
			int colIndex = Integer.parseInt(items[1]);
			int valueInt = Integer.parseInt(items[2]);
			
			Text outKey = null;
			Text outValue = null;
			for(int i=0;i<ROW_COUNT;i++){
				outKey = new Text((i+1) + "," + colIndex);
				outValue = new Text("b,"+rowIndex+","+valueInt);
				context.write(outKey, outValue);
			}
			
		}
		
	}
	
	public static class MartrixReducer extends Reducer<Text,Text,Text,IntWritable>{

		@Override
		protected void reduce(Text key, Iterable<Text> values,Context context)
				throws IOException, InterruptedException {

			String[] items = new String[3];
			
			int[] valueA = new int[BROW_ACOL];
			int[] valueB = new int[BROW_ACOL];
			
			Iterator<Text> it = values.iterator();
			while(it.hasNext()){
				items = it.next().toString().split(",");
				if(items[0].equals("a")){
					valueA[Integer.parseInt(items[1])-1] = Integer.parseInt(items[2]);
				}else if(items[0].equals("b")){
					valueB[Integer.parseInt(items[1])-1] = Integer.parseInt(items[2]);
				}
			}
			
			int result = 0;
			for(int i=0;i<BROW_ACOL;i++){
				result += valueA[i]*valueB[i];
			}
			context.write(key, new IntWritable(result));
		}
		
	}
	
	@SuppressWarnings("deprecation")
	public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
		
		Path pathA = new Path("hdfs://localhost:9000/Martrix/a.txt");
		Path pathB = new Path("hdfs://localhost:9000/Martrix/b.txt");
		Path pathOut = new Path("hdfs://localhost:9000/Martrix/out");
		
		Configuration conf = new Configuration();
		Job job = new Job(conf,"MartrixMultiply");
		
		job.setJarByClass(MartrixMultiply.class);
		
		MultipleInputs.addInputPath(job, pathA, TextInputFormat.class, MartrixMaperA.class);
		MultipleInputs.addInputPath(job, pathB, TextInputFormat.class, MartrixMaperB.class);
		
		job.setReducerClass(MartrixReducer.class);
		
		job.setMapOutputKeyClass(Text.class);
		job.setMapOutputValueClass(Text.class);
		
		job.setOutputKeyClass(Text.class);
		job.setOutputValueClass(IntWritable.class);
		
		FileOutputFormat.setOutputPath(job, pathOut);
		
		if(job.waitForCompletion(true)){
			System.exit(0);
		}else{
			System.exit(1);
		}
		
	}
	
}


  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值