MapReduce 写入 MySQL

参考这个博客


import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
import java.sql.PreparedStatement;
import java.sql.ResultSet;
import java.sql.SQLException;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.Writable;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.db.DBConfiguration;
import org.apache.hadoop.mapreduce.lib.db.DBOutputFormat;
import org.apache.hadoop.mapreduce.lib.db.DBWritable;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.util.Tool;
import org.apache.hadoop.util.ToolRunner;


/**
 * MapReduce job that reads tab-separated text lines and writes one database row per
 * line through {@link DBOutputFormat}.
 *
 * <p>Each input line must contain at least three tab-separated fields. The first three
 * fields are bound, in order, to the three columns passed to
 * {@code DBOutputFormat.setOutput} in {@link #run(String[])}.
 *
 * <p>The JDBC driver, URL, user name and password default to the values hard-coded
 * below, but can be overridden on the command line with the generic {@code -D} option
 * using the {@link DBConfiguration} property names, for example
 * {@code -Dmapreduce.jdbc.url=jdbc:mysql://host:3306/db}.
 *
 * @author asheng
 */
public class WriteDataToMysql extends Configured implements Tool {

    /**
     * Separator used to pack the first two input fields into the map output key.
     * A tab is used because the input line is split on tabs, so a field can never
     * contain one; a comma could legitimately appear inside a field.
     */
    private static final String KEY_SEPARATOR = "\t";

    /** Counter group used to report skipped input lines. */
    private static final String COUNTER_GROUP = "WriteDataToMysql";

    /** Counter name for input lines with fewer than three fields. */
    private static final String MALFORMED_LINES = "MALFORMED_LINES";

    // Default connection settings.
    // NOTE(review): credentials are kept in source only as defaults for local testing;
    // prefer passing them with -D so they do not have to live in the code.
    private static final String DEFAULT_DRIVER = "com.mysql.cj.jdbc.Driver";
    private static final String DEFAULT_URL =
            "jdbc:mysql://127.0.0.1:3306/mapreduce_test?serverTimezone=UTC&characterEncoding=utf-8";
    private static final String DEFAULT_USER = "ecjtu";
    private static final String DEFAULT_PASSWORD = "123456";

    /**
     * Record type written to the database: three string columns.
     *
     * <p>Implements {@link Writable} for Hadoop serialization and {@link DBWritable}
     * so that it can bind itself to, and read itself from, JDBC objects.
     *
     * @author asheng
     */
    public static class TblsWritable implements Writable, DBWritable {
        String tbl_name;
        String tbl_name1;
        String tbl_type;

        /** No-argument constructor; leaves all three fields {@code null}. */
        public TblsWritable() {
        }

        TblsWritable(String tbl_name, String tbl_name1, String tbl_type) {
            this.tbl_name = tbl_name;
            this.tbl_name1 = tbl_name1;
            this.tbl_type = tbl_type;
        }

        /** Binds the three fields to statement parameters 1, 2 and 3. */
        @Override
        public void write(PreparedStatement statement) throws SQLException {
            statement.setString(1, this.tbl_name);
            statement.setString(2, this.tbl_name1);
            statement.setString(3, this.tbl_type);
        }

        /** Populates the three fields from result-set columns 1, 2 and 3. */
        @Override
        public void readFields(ResultSet resultSet) throws SQLException {
            this.tbl_name = resultSet.getString(1);
            this.tbl_name1 = resultSet.getString(2);
            this.tbl_type = resultSet.getString(3);
        }

        /** Serializes the three fields, in order, with {@code writeUTF}. */
        @Override
        public void write(DataOutput out) throws IOException {
            out.writeUTF(this.tbl_name);
            out.writeUTF(this.tbl_name1);
            out.writeUTF(this.tbl_type);
        }

        /** Deserializes the three fields in the order they were written. */
        @Override
        public void readFields(DataInput in) throws IOException {
            this.tbl_name = in.readUTF();
            this.tbl_name1 = in.readUTF();
            this.tbl_type = in.readUTF();
        }

        /** Returns the three fields separated by single spaces. */
        @Override
        public String toString() {
            return this.tbl_name + " " + this.tbl_name1 + " " + this.tbl_type;
        }
    }

    /**
     * Splits each input line on tabs and emits
     * {@code <field0 + KEY_SEPARATOR + field1, field2>}.
     */
    public static class ConnMysqlMapper extends Mapper<LongWritable, Text, Text, Text> {
        // Reused across map() calls to avoid allocating two Text objects per record.
        private final Text outKey = new Text();
        private final Text outValue = new Text();

        /**
         * @param key     offset of the line in the input; not used
         * @param value   one input line
         * @param context task context used to emit the pair and to count skipped lines
         */
        @Override
        public void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
            // Split once instead of once per field.
            String[] fields = value.toString().split("\t");
            if (fields.length < 3) {
                // A short line cannot fill all three columns; skip it and make the skip
                // visible through a job counter instead of failing the whole task.
                context.getCounter(COUNTER_GROUP, MALFORMED_LINES).increment(1);
                return;
            }
            outKey.set(fields[0] + KEY_SEPARATOR + fields[1]);
            outValue.set(fields[2]);
            context.write(outKey, outValue);
        }
    }

    /**
     * Turns every {@code <key, value>} pair into a {@link TblsWritable} record and
     * hands it to the output format.
     */
    public static class ConnMysqlReducer extends Reducer<Text, Text, TblsWritable, TblsWritable> {
        /**
         * @param key     first two fields joined with {@code KEY_SEPARATOR}
         * @param values  third-field values that share this key
         * @param context task context used to emit the records
         * @throws IOException if the key does not contain the separator
         */
        @Override
        public void reduce(Text key, Iterable<Text> values, Context context) throws IOException,
                InterruptedException {
            // The key is the same for every value, so decode it once outside the loop.
            String packed = key.toString();
            int sep = packed.indexOf(KEY_SEPARATOR);
            if (sep < 0) {
                throw new IOException("Map output key has no field separator: " + packed);
            }
            String first = packed.substring(0, sep);
            String second = packed.substring(sep + KEY_SEPARATOR.length());

            for (Text value : values) {
                // The record itself carries all three columns, so the output value is
                // unused and passed as null.
                context.write(new TblsWritable(first, second, value.toString()), null);
            }
        }
    }

    /**
     * Configures and runs the job.
     *
     * @param args {@code args[0]} is the input path
     * @return 0 if the job succeeded, 1 if it failed, 2 if the input path is missing
     */
    @Override
    public int run(String[] args) throws Exception {
        if (args == null || args.length < 1) {
            System.err.println("Usage: WriteDataToMysql <input path>");
            return 2;
        }

        Configuration conf = getConf();
        // Values supplied with -D take precedence; otherwise fall back to the defaults.
        DBConfiguration.configureDB(conf,
                conf.get(DBConfiguration.DRIVER_CLASS_PROPERTY, DEFAULT_DRIVER),
                conf.get(DBConfiguration.URL_PROPERTY, DEFAULT_URL),
                conf.get(DBConfiguration.USERNAME_PROPERTY, DEFAULT_USER),
                conf.get(DBConfiguration.PASSWORD_PROPERTY, DEFAULT_PASSWORD));

        Job job = Job.getInstance(conf, "test mysql connection");
        job.setJarByClass(WriteDataToMysql.class);

        job.setMapperClass(ConnMysqlMapper.class);
        job.setReducerClass(ConnMysqlReducer.class);

        // The mapper emits Text/Text while the reducer emits TblsWritable, so the
        // intermediate and final output classes must be declared separately.
        job.setMapOutputKeyClass(Text.class);
        job.setMapOutputValueClass(Text.class);
        job.setOutputKeyClass(TblsWritable.class);
        job.setOutputValueClass(TblsWritable.class);

        job.setInputFormatClass(TextInputFormat.class);
        job.setOutputFormatClass(DBOutputFormat.class);
        FileInputFormat.addInputPath(job, new Path(args[0]));

        // Target table and the three columns the record fields are bound to, in order.
        DBOutputFormat.setOutput(job, "good_user", "uid", "gid", "exp");
        return job.waitForCompletion(true) ? 0 : 1;
    }

    /**
     * Entry point. Runs the tool and exits with its return code so that a failed job
     * is visible to the calling shell or scheduler.
     *
     * <p>When running from an IDE without program arguments, pass a hard-coded array
     * such as {@code {"hdfs://ljc:9000/buaa/student/student.txt"}} instead of
     * {@code args}.
     */
    public static void main(String[] args) throws Exception {
        System.exit(ToolRunner.run(new WriteDataToMysql(), args));
    }
}
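// Example program argument (input path): /home/asheng/hadoop/in/test3.txt
// Every line of test3.txt must contain three fields separated by a TAB character
// (shown here as <TAB>), for example:
/*
abc<TAB>x<TAB>1
def<TAB>y<TAB>2
chd<TAB>z<TAB>3
*/
// The three fields of each line are inserted into the columns uid, gid and exp
// of the table good_user, in that order.


// Check the result in the MySQL database:
// select * from good_user;
// Three new rows should appear:
/*
abc x 1
def y 2
chd z 3
*/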

  • 1
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 3
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 3
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值