// Event-time demo pipeline: reads "key,timestamp" records from an in-memory
// collection, assigns event timestamps and watermarks, and maps every record
// to a (key, 1) pair.
val env = StreamExecutionEnvironment.getExecutionEnvironment
env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
env.setParallelism(1)

val sourceStream = env
  .fromCollection(List(
    "a,1646150400000",
    "a,1646150403000",
    "a,1646150406000",
    "a,1646150410000",
    "a,1646150415000",
    "b,1646150400000",
    "b,1646150403000",
    "b,1646150410000",
    "b,1646150415000",
    "c,1646150400000",
    "c,1646150403000",
    "c,1646150415000"
  ))
  .assignTimestampsAndWatermarks(
    // Time.seconds(3) is the out-of-orderness bound handed to the extractor.
    new BoundedOutOfOrdernessTimestampExtractor[String](Time.seconds(3)) {
      // The second comma-separated field of each record is used as its event timestamp.
      override def extractTimestamp(t: String): Long = t.split(",")(1).toLong
    }
  )

// Emits (key, 1) for every record, where key is the first comma-separated field.
// NOTE(review): this was annotated DataStream[(Long, String, Int)], which does not
// match the (String, Int) pairs produced by the map below and cannot compile.
// Presumably later keyBy/window steps (not visible here) produced that shape;
// restore the wider type once those steps are chained on.
val aggData: DataStream[(String, Int)] = sourceStream.map { line =>
  val splits = line.split(",")
  (splits(0), 1)
}
Flink对keyBy汇总后的数据排序
最新推荐文章于 2024-06-02 01:54:41 发布