spark streaming python实例_实时 Spark Streaming 消费示例

## StructuredLoghubSample.scala

/**
 * Structured Streaming sample: reads records from the `loghub` streaming source,
 * keeps the `content` column as a string, and appends it to Parquet files.
 *
 * Positional arguments:
 *   0. project               - value for the `sls.project` option
 *   1. logStore              - value for the `sls.store` option
 *   2. accessKeyId           - value for the `access.key.id` option
 *   3. accessKeySecret       - value for the `access.key.secret` option
 *   4. endpoint              - value for the `endpoint` option
 *   5. startingOffsets       - value for the `startingoffsets` option
 *   6. maxOffsetsPerTrigger  - value for the `maxOffsetsPerTrigger` option
 *   7. outputPath            - directory the Parquet sink writes to
 *   8. checkpointLocation    - optional; defaults to a fresh `/tmp/temporary-<uuid>` path
 */
object StructuredLoghubSample {

  // Imported locally so the sample is self-contained; harmless if the file
  // also imports these names at the top.
  import java.util.UUID

  import org.apache.spark.sql.SparkSession
  import org.apache.spark.sql.streaming.Trigger

  /**
   * Entry point. Prints the usage and exits with status 1 when fewer than the
   * eight mandatory arguments are supplied; otherwise starts the streaming
   * query and blocks until it terminates.
   *
   * @param args positional command-line arguments, see the object documentation
   */
  def main(args: Array[String]): Unit = {
    // The destructuring below binds eight names, so eight arguments are
    // mandatory. A smaller threshold would let a short argument list through
    // and fail with a MatchError instead of the usage message.
    if (args.length < 8) {
      System.err.println(
        "Usage: StructuredLoghubSample <logService-project> <logService-store> " +
          "<access-key-id> <access-key-secret> <endpoint> <starting-offsets> " +
          "<max-offsets-per-trigger> <output-path> [<checkpoint-location>]")
      System.exit(1)
    }

    val Array(project, logStore, accessKeyId, accessKeySecret, endpoint,
      startingOffsets, maxOffsetsPerTrigger, outputPath, _*) = args

    // Optional ninth argument; otherwise use a unique throw-away directory.
    val checkpointLocation =
      if (args.length > 8) args(8) else "/tmp/temporary-" + UUID.randomUUID.toString

    // NOTE(review): the master is hard-coded to local mode with 5 threads;
    // drop `.master(...)` when submitting to a cluster.
    val spark = SparkSession
      .builder
      .appName("StructuredLoghubSample")
      .master("local[5]")
      .getOrCreate()

    import spark.implicits._

    // Create DataSet representing the stream of input lines from loghub
    // NOTE(review): the ZooKeeper address is hard-coded to localhost:2181.
    val lines = spark
      .readStream
      .format("loghub")
      .option("sls.project", project)
      .option("sls.store", logStore)
      .option("access.key.id", accessKeyId)
      .option("access.key.secret", accessKeySecret)
      .option("endpoint", endpoint)
      .option("startingoffsets", startingOffsets)
      .option("zookeeper.connect.address", "localhost:2181")
      .option("maxOffsetsPerTrigger", maxOffsetsPerTrigger)
      .load()
      .selectExpr("CAST(content AS STRING)")
      .as[String]

    // Append each micro-batch to Parquet, triggering every 30000 ms.
    val query = lines.writeStream
      .format("parquet")
      .option("checkpointLocation", checkpointLocation)
      .option("path", outputPath)
      .outputMode("append")
      .trigger(Trigger.ProcessingTime(30000))
      .start()

    query.awaitTermination()
  }
}

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值