Hadoop/MapReduce(单词统计--读写数据库)

最新推荐文章于 2022-05-03 22:34:45 发布

zhuzihuaile

最新推荐文章于 2022-05-03 22:34:45 发布

阅读量463

点赞数

分类专栏： hadoop Java

本文链接：https://blog.csdn.net/u010379996/article/details/50886020

版权

Java 同时被 2 个专栏收录

14 篇文章 1 订阅

订阅专栏

hadoop

3 篇文章 0 订阅

订阅专栏

单词统计

1. MySQL

-- Input table for the job: one row per word occurrence.
-- `count` defaults to 1, so inserting only `name` records a single occurrence.
CREATE TABLE `word` (
   `id` int(11) NOT NULL AUTO_INCREMENT,
   `name` varchar(20) NOT NULL COMMENT '单词',
   `count` int(11) NOT NULL DEFAULT '1' COMMENT '次数',
   PRIMARY KEY (`id`)
 ) ENGINE=InnoDB DEFAULT CHARSET=utf8 COMMENT='单词表';

-- Output table for the job: same columns as `word`; the job writes `count` and `name` here.
CREATE TABLE `word2` (
   `id` int(11) NOT NULL AUTO_INCREMENT,
   `name` varchar(20) NOT NULL COMMENT '单词',
   `count` int(11) NOT NULL DEFAULT '1' COMMENT '次数',
   PRIMARY KEY (`id`)
 ) ENGINE=InnoDB DEFAULT CHARSET=utf8 COMMENT='单词统计表';

-- Seed data: 16 word occurrences; `count` is omitted and takes its default of 1.
INSERT INTO word (name) VALUES
  ('JAVA'),
  ('Hadoop'),
  ('Spring'),
  ('Hadoop'),
  ('JAVA'),
  ('JAVA'),
  ('JAVA'),
  ('Spring'),
  ('Mysql'),
  ('Hadoop'),
  ('Mysql'),
  ('Spring'),
  ('Hadoop'),
  ('Mysql'),
  ('Mysql'),
  ('Hadoop');

2. Java

public class Demo08 {
	public static class WordRecord implements Writable, DBWritable {
		int count;
		String name;
		public WordRecord() {
		}
		public void readFields(DataInput in) throws IOException {
			this.count = in.readInt();
			this.name = Text.readString(in);
		}		
		public void write(PreparedStatement stmt) throws SQLException {
			stmt.setInt(1, this.count);
			stmt.setString(2, this.name);
		}
		public void readFields(ResultSet result) throws SQLException {
			this.count = result.getInt(1);
			this.name = result.getString(2);
		}
		public void write(DataOutput out) throws IOException {
			out.writeInt(this.count);
			Text.writeString(out, this.name);
		}
	}

	public static class DBInputMapper extends MapReduceBase
			implements Mapper<LongWritable, WordRecord, Text, IntWritable> {
		public void map(LongWritable key, WordRecord value, OutputCollector<Text, IntWritable> collector,
				Reporter reporter) throws IOException {
			collector.collect(new Text(value.name), new IntWritable(value.count));
		}
	}

	public static class MyReducer extends MapReduceBase
			implements Reducer<Text, IntWritable, WordRecord, LongWritable> {
		public void reduce(Text key, Iterator<IntWritable> values, OutputCollector<WordRecord, LongWritable> output,
				Reporter reporter) throws IOException {
			WordRecord r = new WordRecord();
			r.name = key.toString();
			while(values.hasNext()){		
				r.count += values.next().get();
			}
			output.collect(r, new LongWritable(r.count));
		}
	}

	@SuppressWarnings("deprecation")
	public static void main(String[] args) throws IOException {
		JobConf conf = new JobConf(Demo08.class);
               //加载mysql连接jar包
                DistributedCache.addFileToClassPath(new Path("/tool/lib/mysql.jar"), conf);

		conf.setMapOutputKeyClass(Text.class);
		conf.setMapOutputValueClass(IntWritable.class);
		conf.setOutputKeyClass(Text.class);
		conf.setOutputValueClass(IntWritable.class);

		conf.setOutputFormat(DBOutputFormat.class);
		conf.setInputFormat(DBInputFormat.class);

		DBConfiguration.configureDB(conf, "com.mysql.jdbc.Driver", "jdbc:mysql://192.168.1.194:3306/test", "root", "root");
		String[] fields = { "count", "name" };
		DBInputFormat.setInput(conf, WordRecord.class, "word", null, null, fields);
		DBOutputFormat.setOutput(conf, "word2", "count", "name");
		conf.setMapperClass(DBInputMapper.class);
		conf.setReducerClass(MyReducer.class);

		JobClient.runJob(conf);
	}
}

zhuzihuaile

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
Hadoop/MapReduce(单词统计--读写数据库)

单词统计1. MySQL CREATE TABLE `word` ( `id` int(11) NOT NULL AUTO_INCREMENT, `name` varchar(20) NOT NULL COMMENT '单词', `count` int(11) NOT NULL DEFAULT '1' COMMENT '次数', PRIMARY KEY (`
复制链接

扫一扫