java mapreduce mysql_Hadoop编程之MapReduce操作Mysql数据库

1,首先建立mysql的数据库,表:如下图

1361811068_3342.jpg

下面是MapReduce编程了,需要导入mysql数据库驱动jar包;

首先需要自定义Recoder,这里是CourceRecord

public class CourceRecord implements Writable, DBWritable {

int id;

String name;

int count;

int no;

//从in流反序列化出内容

@Override

public void readFields(DataInput in) throws IOException {

this.id = in.readInt();

this.name = Text.readString(in);

this.count = in.readInt();

this.no = in.readInt();

}

//将内容序列化到out流

@Override

public void write(DataOutput out) throws IOException {

out.writeInt(this.id);

Text.writeString(out, this.name);

out.writeInt(this.count);

out.writeInt(this.no);

}

@Override

public void readFields(ResultSet result) throws SQLException {

this.id = result.getInt(1);

this.name = result.getString(2);

this.count = result.getInt(3);

this.no = result.getInt(4);

}

@Override

public void write(PreparedStatement stmt) throws SQLException {

stmt.setInt(1, this.id);

stmt.setString(2, this.name);

stmt.setInt(3, this.count);

stmt.setInt(4, this.no);

}

@Override

public String toString() {

return new String(this.name + " " + this.count + " " + this.no);

}

}

------------------------------------------------map类-----------------------------------

public class DBMapper extends MapReduceBase implements

Mapper {

public void map(LongWritable key, CourceRecord value,

OutputCollector collector, Reporter reporter)

throws IOException {

collector.collect(new LongWritable(value.id),

new Text(value.toString()));

}

}

--------------------------------------driver驱动类DB------------------

public class DB {

public static void main(String[] args) throws IOException {

String[] argc={"jdbc:mysql://localhost/test","root", "111111"};

try {

JobConf conf = new JobConf(DB.class);

Class.forName("com.mysql.jdbc.Driver");

DBConfiguration.configureDB(conf, "com.mysql.jdbc.Driver",argc[0], argc[1], argc[2]);

String[] fields = { "id", "name", "count", "no" };

DBInputFormat.setInput(conf, CourceRecord.class, "tb", null,"id", fields);

conf.setInputFormat(DBInputFormat.class);

conf.setOutputKeyClass(LongWritable.class);

conf.setOutputValueClass(Text.class);

Path path = new Path("DBOUTPUT");

FileOutputFormat.setOutputPath(conf, path);

conf.setMapperClass(DBMapper.class);

conf.setReducerClass(IdentityReducer.class);

//如果文件存在则删除

FileSystem hdfs = path.getFileSystem(conf);

if (hdfs.exists(path)) {

hdfs.delete(path, true);

}

JobClient.runJob(conf);

}

catch(ClassNotFoundException e) {

System.err.println("mysql.jdbc.Driver not found");

}

}

------------------------------------------------------

运行:在DBOUTPUT目录下生成一个part-00000的文件,其内容为:

17hello 28 17

18hadoop 28 18

19java 28 19

20hive 16 20

21hbase 18 21

22pig 18 22

实例是跑起来了,主要是DB的一个配置,相关设置函数:

DBConfiguration.configureDB (JobConf job, String driverClass, String Url, String userName, String passwd)

DBInputFormat.setInput(JobConf job, Class<?extends DBWritable> inputClass,

String tableName, String conditions,String orderBy, String fieldNames)

DBOutputFormat.setOut(JobConf

job,String tablename,String fieldNames);

eg:DBOutputFormat.setOut(job,"tb",28,"mahout",30,401)

分享到:

18e900b8666ce6f233d25ec02f95ee59.png

72dd548719f0ace4d5f9bca64e1d7715.png

2014-04-25 16:08

浏览 349

评论

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值