匿名内部类方式
package com.atguigu.Adatastream_api.transformations;
import org.apache.flink.api.common.functions.RichFilterFunction;
import org.apache.flink.api.common.functions.RichFlatMapFunction;
import org.apache.flink.api.common.functions.RichMapFunction;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple3;
import org.apache.flink.streaming.api.TimeCharacteristic;
import org.apache.flink.streaming.api.datastream.DataStream;
import org.apache.flink.streaming.api.datastream.DataStreamSource;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;
import org.apache.flink.util.Collector;
/**
 * Exercises the {@code flatMap}, {@code map} and {@code filter} operators using anonymous
 * inner classes. The same pipeline can also be written with lambda expressions.
 */
public class AMapText {
    /**
     * Builds and runs the job: read a text file, split each line into words, attach the
     * word length to every word, keep only the word {@code "hello"} and print the result.
     *
     * @param args command-line arguments (not used)
     * @throws Exception if building or executing the job fails
     */
    public static void main(String[] args) throws Exception {
        // Create the execution environment.
        StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
        env.setParallelism(1);
        env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime);

        // Read the input data.
        DataStreamSource<String> inputStream = env.readTextFile("G:\\SoftwareInstall\\idea\\project\\UserBehaviorAnalysis\\BasicKnowledge\\src\\main\\resources\\hello.txt");

        // Tokenize, add the word length, then filter.
        DataStream<Tuple3<String, Integer, Integer>> result = inputStream
                .flatMap(new RichFlatMapFunction<String, Tuple2<String, Integer>>() {
                    @Override
                    public void flatMap(String line, Collector<Tuple2<String, Integer>> out) throws Exception {
                        // Split on single spaces and emit (word, 1) for every token.
                        for (String word : line.split(" ")) {
                            // Tuple2.of keeps the element types, unlike the raw `new Tuple2(...)`.
                            out.collect(Tuple2.of(word, 1));
                        }
                    }
                })
                // Type parameter 1: input format; type parameter 2: output format,
                // which adds a field holding the length of the word.
                .map(new RichMapFunction<Tuple2<String, Integer>, Tuple3<String, Integer, Integer>>() {
                    @Override
                    public Tuple3<String, Integer, Integer> map(Tuple2<String, Integer> data) throws Exception {
                        // (word, 1) -> (word, word length, 1)
                        return Tuple3.of(data.f0, data.f0.length(), data.f1);
                    }
                })
                .filter(new RichFilterFunction<Tuple3<String, Integer, Integer>>() {
                    @Override
                    public boolean filter(Tuple3<String, Integer, Integer> data) throws Exception {
                        // Keep only records whose word is exactly "hello".
                        return "hello".equals(data.f0);
                    }
                });

        // Output the data.
        result.print(" 匿名内部类方式测试map/flapMap/filter等算子");
        env.execute(" 匿名内部类方式测试map/flapMap/filter等算子");
    }
}
lambda表达式方式
package com.atguigu.Adatastream_api.transformations;
import org.apache.flink.api.common.typeinfo.Types;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple3;
import org.apache.flink.streaming.api.TimeCharacteristic;
import org.apache.flink.streaming.api.datastream.DataStream;
import org.apache.flink.streaming.api.datastream.DataStreamSource;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;
import org.apache.flink.util.Collector;
/**
 * Exercises the {@code flatMap}, {@code map} and {@code filter} operators using lambda
 * expressions.
 */
public class AMapText {
    /**
     * Builds and runs the job: read a text file, split each line into words, attach the
     * word length to every word, keep only the word {@code "hello"} and print the result.
     *
     * @param args command-line arguments (not used)
     * @throws Exception if building or executing the job fails
     */
    public static void main(String[] args) throws Exception {
        // Create the execution environment.
        StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
        env.setParallelism(1);
        env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime);

        // Read the input data.
        DataStreamSource<String> inputStream = env.readTextFile("G:\\SoftwareInstall\\idea\\project\\UserBehaviorAnalysis\\BasicKnowledge\\src\\main\\resources\\hello.txt");

        // Tokenize, add the word length, then filter.
        DataStream<Tuple3<String, Integer, Integer>> result = inputStream
                .flatMap((String str, Collector<Tuple2<String, Integer>> out) -> {
                    // Split on single spaces and emit (word, 1) for every token.
                    for (String word : str.split(" ")) {
                        // Tuple2.of keeps the element types, unlike the raw `new Tuple2(...)`.
                        out.collect(Tuple2.of(word, 1));
                    }
                })
                // The generic arguments of a lambda's output are erased by the compiler, so the
                // tuple type has to be declared explicitly for Flink's type extraction.
                .returns(Types.TUPLE(Types.STRING, Types.INT))
                // (word, 1) -> (word, word length, 1)
                .map(data -> Tuple3.of(data.f0, data.f0.length(), data.f1))
                // Same erasure issue for the Tuple3 produced by the map lambda.
                .returns(Types.TUPLE(Types.STRING, Types.INT, Types.INT))
                // Keep only records whose word is exactly "hello".
                .filter(data -> "hello".equals(data.f0));

        // Output the data.
        result.print(" lambda表达式方式测试map/flapMap/filter等算子");
        env.execute(" lambda表达式方式测试map/flapMap/filter等算子");
    }
}