flink sql 自定义 source 读取kafka(RichSourceFunction 模式)

  1. 先定义 KafkaSourceFunction:
package com.alpha;
import com.alibaba.fastjson.JSON;
import org.apache.flink.configuration.Configuration;
import org.apache.flink.streaming.api.functions.source.RichSourceFunction;
import org.apache.flink.types.Row;
import org.apache.kafka.clients.consumer.ConsumerConfig;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.apache.kafka.clients.consumer.ConsumerRecords;
import org.apache.kafka.clients.consumer.KafkaConsumer;
import org.apache.kafka.clients.producer.KafkaProducer;
import org.apache.kafka.clients.producer.ProducerConfig;
import org.apache.kafka.common.serialization.StringDeserializer;
import java.util.Arrays;
import java.util.Map;
import java.util.Properties;

/**
 * Flink source that polls the Kafka topic {@code topic_test_flink} and emits one
 * {@link Row} per message.
 *
 * <p>Each message value is parsed as a JSON object; the {@code timestamp}, {@code name}
 * and {@code age} entries are converted to strings and emitted, in that order, as a
 * three-field row. A field missing from the JSON is emitted as {@code null}, and a
 * message with a null or empty value is skipped.
 *
 * <p>The source runs until {@link #cancel()} is called; the consumer is released in
 * {@link #close()}.
 */
class KafkaSourceFunction extends RichSourceFunction<Row> {

    // Declared by the original listing but never assigned or used in this class.
    // Kafka clients are not serializable, so client fields are transient: Flink
    // serializes the function before open() is invoked.
    transient KafkaProducer<String, String> producer;
    transient KafkaConsumer<String, String> consumer;

    // Written by cancel() from another thread, read by the polling loop in run().
    // Deliberately NOT transient: it must still be true after the function is deserialized.
    private volatile boolean running = true;

    /**
     * Creates the Kafka consumer and subscribes it to the topic.
     *
     * @param parameters Flink configuration passed to the function (not read here)
     * @throws Exception if the consumer cannot be created or subscribed
     */
    @Override
    public void open(Configuration parameters) throws Exception {
        Properties props = new Properties();
        props.put(ConsumerConfig.KEY_DESERIALIZER_CLASS_CONFIG, StringDeserializer.class.getName());
        props.put(ConsumerConfig.VALUE_DESERIALIZER_CLASS_CONFIG, StringDeserializer.class.getName());
        props.put(ConsumerConfig.GROUP_ID_CONFIG, "default-009");
        // Same property key as the producer-side constant, but this is a consumer configuration.
        props.put(ConsumerConfig.BOOTSTRAP_SERVERS_CONFIG, "bigdata006:9092,bigdata007:9092,bigdata008:9092");

        // Create the consumer.
        consumer = new KafkaConsumer<>(props);
        consumer.subscribe(Arrays.asList("topic_test_flink"));
    }

    /**
     * Polls Kafka until the source is cancelled and emits one row per usable record.
     *
     * @param sourceContext context used to emit rows downstream
     * @throws Exception if polling, JSON parsing or emission fails
     */
    @Override
    public void run(SourceContext<Row> sourceContext) throws Exception {
        // The 100 ms poll timeout bounds how long a cancel() request can go unnoticed.
        while (running) {
            ConsumerRecords<String, String> records = consumer.poll(100);

            for (ConsumerRecord<String, String> record : records) {
                Map<String, Object> map = JSON.parseObject(record.value());
                if (map == null) {
                    // parseObject yields null for a null/empty payload; nothing to emit.
                    continue;
                }

                Row row = Row.of(
                        asString(map.get("timestamp")),
                        asString(map.get("name")),
                        asString(map.get("age")));
                sourceContext.collect(row);
            }
        }
    }

    /** Asks the polling loop in {@link #run} to stop after the current poll/batch. */
    @Override
    public void cancel() {
        running = false;
    }

    /**
     * Releases the Kafka consumer.
     *
     * <p>NOTE(review): KafkaConsumer is not thread-safe; this assumes Flink invokes
     * close() on the task thread after run() has returned — confirm for the Flink
     * version in use.
     *
     * @throws Exception if closing the consumer or the parent function fails
     */
    @Override
    public void close() throws Exception {
        running = false;
        try {
            if (consumer != null) {
                consumer.close();
                consumer = null;
            }
        } finally {
            super.close();
        }
    }

    /** Null-safe string conversion for a JSON field value. */
    private static String asString(Object fieldValue) {
        return fieldValue == null ? null : fieldValue.toString();
    }

}
  2. 主程序:
package com.alpha;

import com.alibaba.fastjson.JSON;
import kafka.utils.Json;
import org.apache.flink.api.common.functions.MapFunction;
import org.apache.flink.api.common.io.InputFormat;
import org.apache.flink.api.common.typeinfo.BasicTypeInfo;
import org.apache.flink.api.common.typeinfo.TypeInfo;
import org.apache.flink.api.common.typeinfo.TypeInformation;
import org.apache.flink.api.common.typeinfo.Types;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple4;
import org.apache.flink.api.java.tuple.Tuple5;
import org.apache.flink.api.java.tuple.Tuple9;
import org.apache.flink.api.java.typeutils.RowTypeInfo;
import org.apache.flink.configuration.Configuration;
import org.apache.flink.streaming.api.datastream.DataStream;
import org.apache.flink.streaming.api.datastream.DataStreamSource;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;

import org.apache.flink.streaming.api.functions.source.InputFormatSourceFunction;
import org.apache.flink.streaming.api.functions.source.RichSourceFunction;
import org.apache.flink.streaming.api.functions.source.SourceFunction;
import org.apache.flink.table.api.Table;
import org.apache.flink.table.api.TableEnvironment;
import org.apache.flink.table.api.TableSchema;
import org.apache.flink.table.api.java.StreamTableEnvironment;
import com.alibaba.fastjson.JSONObject;
import org.apache.flink.table.sinks.CsvTableSink;
import org.apache.flink.table.sinks.TableSink;
import org.apache.flink.table.sources.StreamTableSource;
import org.apache.flink.table.sources.TableSource;
import org.apache.flink.types.Row;
import org.apache.kafka.clients.consumer.ConsumerConfig;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.apache.kafka.clients.consumer.ConsumerRecords;
import org.apache.kafka.clients.consumer.KafkaConsumer;
import org.apache.kafka.clients.producer.KafkaProducer;
import org.apache.kafka.clients.producer.ProducerConfig;
import org.apache.kafka.clients.producer.ProducerRecord;
import org.apache.kafka.common.serialization.Deserializer;
import org.apache.kafka.common.serialization.StringDeserializer;
import org.apache.kafka.common.serialization.StringSerializer;

import java.util.Arrays;
import java.util.Date;
import java.util.Map;
import java.util.Properties;

/**
 * Job entry point: reads rows from {@link KafkaSourceFunction}, exposes them as a Flink
 * table with the columns {@code ttime}, {@code name} and {@code age}, and writes every
 * row to a CSV sink through a SQL {@code INSERT}.
 */
public class KafkaAvro {

    /**
     * Builds and runs the streaming job.
     *
     * @param args command-line arguments (not read)
     * @throws Exception if building or executing the job fails
     */
    public static void main(String[] args) throws Exception {

        // Set up the streaming and table environments.
        final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
        final StreamTableEnvironment tableEnv = StreamTableEnvironment.create(env);

        // Column names and types of the rows produced by the source.
        final String[] sourceColumns = {"ttime", "name", "age"};
        final TypeInformation<?>[] sourceColumnTypes = {
                TypeInformation.of(String.class),
                TypeInformation.of(String.class),
                TypeInformation.of(String.class)
        };
        final TypeInformation<Row> rowType = new RowTypeInfo(sourceColumnTypes, sourceColumns);

        // Attach the custom source function and view its stream as a table.
        final DataStream<Row> kafkaRows = env.addSource(new KafkaSourceFunction(), rowType);
        final Table sourceTable = tableEnv.fromDataStream(kafkaRows, "ttime,name,age");

        // CSV sink; the directory name carries the current epoch millis.
        final String outputDir =
                "/Users/bozhong/Documents/code/flinkStreamSQL/data/" + System.currentTimeMillis() + "/";
        final CsvTableSink csvSink = new CsvTableSink(outputDir);
        final String[] sinkColumns = {"ttime", "name", "age"};
        final TypeInformation<?>[] sinkColumnTypes = {Types.STRING, Types.STRING, Types.STRING};
        tableEnv.registerTableSink("sink_tbl", csvSink.configure(sinkColumns, sinkColumnTypes));

        // Copy every source row into the sink table. The Table object is concatenated
        // into the statement text, exactly as in the original listing.
        final String insertStatement = "INSERT INTO sink_tbl SELECT ttime,name,age FROM " + sourceTable;
        tableEnv.sqlUpdate(insertStatement);

        tableEnv.execute("not table run....");
    }

}

  • 0
    点赞
  • 7
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值