// HBase word count (MapReduce example)

package com.neworigin.HBaseMR;

import java.io.IOException;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.CellUtil;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.client.Mutation;
import org.apache.hadoop.hbase.client.Put;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.io.ImmutableBytesWritable;
import org.apache.hadoop.hbase.mapreduce.TableMapReduceUtil;
import org.apache.hadoop.hbase.mapreduce.TableMapper;
import org.apache.hadoop.hbase.mapreduce.TableReducer;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;

public class HbaseMRTest {
    static Configuration conf=null;
    static{
//        配置configuration的三种方法
//        ①直接将hbase-site.xml拿来放到src下面
        conf=HBaseConfiguration.create();
//        ②设置服务器和端口        
//        conf.set("hbase.zookeeper.quorum", "s100:2181,s101:2181,s102:2181");
//        ③扥开设置服务器和端口
        conf.set("hbase.zookeeper.quorum", "s100,s101,s102");
        conf.set("hbase.zookeeper.property.clientPort", "2181");
    }
    
    表信息
//    public static final String tablename="wordtest";//表一
//    public static final String colf="content";//表列族
//    public static final String col="info";////    
//    public static final String tablename2="stat";//表二
//    
//public static void initTB(){
//    
//}    
public static class HBmapper extends TableMapper<Text,IntWritable>/*输出类型*/{
    private static IntWritable one=new IntWritable(1);
    private static Text word =new Text();
//    输入类型,key:row key  value:一行数据的结果集 result
    protected void map(ImmutableBytesWritable key, Result value,
            Mapper<ImmutableBytesWritable, Result, Text, IntWritable>.Context context)
            throws IOException, InterruptedException {
        for(Cell cell:value.rawCells())
        {
            word.set(CellUtil.cloneValue(cell));//读取值
            context.write(word, one);//输出:单词----1
        }
        
    }
}
public static class HBreducer extends TableReducer<Text,IntWritable,ImmutableBytesWritable>{

    @Override
    protected void reduce(Text key, Iterable<IntWritable> values,
            Reducer<Text, IntWritable, ImmutableBytesWritable, Mutation>.Context context)
            throws IOException, InterruptedException {
        
        int sum=0;
        //叠加单词个数
        for(IntWritable value:values)
        {
            sum+=value.get();
        }
        Put put = new Put(Bytes.toBytes(key.toString()));//设置row key为单词
        put.add(Bytes.toBytes("content"), Bytes.toBytes("info"), Bytes.toBytes(String.valueOf(sum)));
        //写到hbase中的需要指定rowkey和put
        context.write(new ImmutableBytesWritable(Bytes.toBytes(key.toString())), put);
    }
    
}
public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
    Job job=new Job(conf,"HBaseMR");
    Scan scan =new Scan();
    TableMapReduceUtil.initTableMapperJob("wordtest",scan, HBmapper.class, Text.class, IntWritable.class, job);
    TableMapReduceUtil.initTableReducerJob("stat", HBreducer.class, job);
    
    job.waitForCompletion(true);
    System.out.println("finished");
}
}

 

转载于:https://www.cnblogs.com/chengdonghui/p/7978285.html

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值