读取HDFS中的文件创建RDD
/**
 * Declares an RDD of text lines backed by a file on HDFS, using a freshly
 * created SparkContext.
 *
 * The context is configured with master `local[*]` and the enclosing class's
 * simple name as the application name. It is always stopped before this
 * method returns, including when an exception is thrown after it is created.
 */
private def makeRDDFromHDFS: Unit = {
  val conf: SparkConf = new SparkConf()
    .setAppName(this.getClass.getSimpleName)
    .setMaster("local[*]")
  val sc = new SparkContext(conf)
  try {
    // Read the HDFS file as an RDD of lines. No action is invoked on the
    // RDD in this method, so it is only declared here.
    val rdd: RDD[String] = sc.textFile("hdfs://doit01:9000/word.txt")
  } finally {
    // Release the context even if the code above fails.
    sc.stop()
  }
}
读取本地文件创建RDD
private def makeRDDFromDisk = { val conf: SparkConf = new SparkConf().setAppName(this.getClass.getSimpleName).setMaster(“local[*]”) val sc = new SparkContext(conf) // 返回的是处理整个文件数据的RDD val rdd: RDD[String] = sc.textFile(“d://word