环境如下(更新了林子雨教程中已无法使用的部分):
Hadoop 2.7.1
Java JDK 11
Spark 3.1.1
1. Maven 安装
2. Java 应用程序编码
/*** SimpleApp.java **/
import org.apache.spark.api.java.*;
import org.apache.spark.api.java.function.Function;
public class SimpleApp {
public static void main(String[] args) {
String logFile = "file:///usr/local/spark/README.md"; // Should be some file on your system
JavaSparkContext sc = new JavaSparkContext("local", "Simple App",
"file:///usr/local/spark/", new String[]{"target/simple-project-1.0.jar"});
JavaRDD<String> logData = sc.textFile(logFile).cache();
long numAs = logData.fi