现在在pom.xml中添加Play框架(play-json)及其所需的Jackson依赖:
<dependency>
    <groupId>com.fasterxml.jackson.module</groupId>
    <artifactId>jackson-module-scala_2.11</artifactId>
    <version>2.7.5</version>
</dependency>
<dependency>
    <groupId>com.fasterxml.jackson.core</groupId>
    <artifactId>jackson-databind</artifactId>
    <version>2.7.0</version>
</dependency>
<dependency>
    <groupId>com.fasterxml.jackson.core</groupId>
    <artifactId>jackson-annotations</artifactId>
    <version>2.7.0</version>
</dependency>
<dependency>
    <groupId>com.fasterxml.jackson.core</groupId>
    <artifactId>jackson-core</artifactId>
    <version>2.7.0</version>
</dependency>
<dependency>
    <groupId>com.typesafe.play</groupId>
    <artifactId>play-json_2.11</artifactId>
    <version>2.7.0</version>
</dependency>
运行时,有时候报错是因为缺少依赖,根据报错信息到Maven Repository查找相关依赖并添加即可。
package Spark.quick
import play.api.libs.json._
import org.apache.spark.{SparkConf, SparkContext}
/**
 * Small Spark job that reads a line-delimited JSON file, keeps the records that
 * describe people who love pandas, and writes those records back out as JSON text.
 */
object test1 {

  /**
   * Shape of one JSON record. The constructor parameter names must match the field
   * names in the JSON file, because the macro-generated format maps them one-to-one.
   */
  case class Person(name: String, lovesPandas: Boolean)

  /**
   * Macro-generated reader and writer for [[Person]].
   * The type is spelled out so implicit resolution does not depend on inference.
   */
  implicit val personReads: OFormat[Person] = Json.format[Person]

  /**
   * Runs the job: load the input file, parse each line, keep the valid [[Person]]
   * records with `lovesPandas == true`, and save them as JSON text.
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    val sparkConf = new SparkConf().setMaster("local[2]").setAppName("JSONApp")
    val sc = new SparkContext(sparkConf)
    try {
      val input = sc.textFile("file:///home/hadoop/data/sparkQuick/learning-spark-master/files/pandainfo.json", 1)

      // Parse each text line into a JSON value. Json.parse throws on malformed or blank
      // lines, so unparsable lines are dropped here instead of failing the whole job.
      val parse = input.flatMap(line => scala.util.Try(Json.parse(line)).toOption)
      // Debug output of the parsed JSON values.
      parse.foreach(println)

      // Keep only the records that match the Person format; anything else is discarded.
      val result = parse.flatMap(record => personReads.reads(record).asOpt)
      // Debug output of the decoded records.
      result.foreach(println)

      // Convert the selected records back to JSON and store them as text.
      result.filter(_.lovesPandas).map(Json.toJson(_)).saveAsTextFile("file:///home/hadoop/data/sparkQuick/learning-spark-master/files/TEST")
    } finally {
      // Always release the Spark context, even when a stage fails.
      sc.stop()
    }
  }
}