我正在试用Flink的新Python流式API,并尝试使用 ./flink-1.6.1/bin/pyflink-stream.sh examples/read_from_kafka.py 运行我的脚本。这个Python脚本相当简单:我只是想从一个已有的主题(topic)中消费数据,并把所有内容发送到stdout(或log目录中的*.out文件,output方法默认会把数据写到那里)。
import glob
import os
import sys
from java.util import Properties
from org.apache.flink.streaming.api.functions.source import SourceFunction
from org.apache.flink.streaming.api.collector.selector import OutputSelector
from org.apache.flink.api.common.serialization import SimpleStringSchema
# Directories that are scanned for *.jar files to expose to this script.
directories = ['/home/user/flink/flink-1.6.1/lib']

# Append every jar found in those directories to sys.path. The script imports
# Java classes (java.util, org.apache.flink), so it runs under a Jython-style
# interpreter; presumably the jars are added here so that later imports of
# Flink connector classes can be resolved -- confirm against the runtime.
for directory in directories:
    for jar in glob.glob(os.path.join(directory, '*.jar')):
        sys.path.append(jar)
# Imported only after the sys.path loop above has run, rather than with the
# other imports at the top of the file -- presumably because the Kafka
# connector classes live in one of the jars added there (TODO confirm).
from org.apache.flink.streaming.connectors.kafka import FlinkKafkaConsumer09
# Fresh, empty java.util.Properties instance. Presumably it is filled from
# the `config` mapping defined next and handed to the Kafka consumer; that
# part of the script is not visible here -- verify.
props = Properties()
config = {"bootstrap_servers": "localhost:9092",