import org.apache.spark.sql.types._
import org.apache.spark.sql.{DataFrame, Dataset, Row, SparkSession}
/** Loads a comma-separated text file of `name,id,score` records into a DataFrame,
  * prints the whole table, then prints the `id` and `score` columns of every
  * record whose score is greater than 80.
  */
object WordCount1 {

  /** Input file used when no path is supplied on the command line. */
  private val DefaultInputPath = "E://download//person.txt"

  /** Explicit schema applied to the parsed rows: name (string), id (int), score (int). */
  private val PersonSchema: StructType = StructType(List(
    StructField("name", StringType, nullable = true),
    StructField("id", IntegerType, nullable = true),
    StructField("score", IntegerType, nullable = true)
  ))

  /** Program entry point.
    *
    * @param args optional; `args(0)` is the path of the input text file.
    *             Falls back to [[DefaultInputPath]] when absent.
    */
  def main(args: Array[String]): Unit = {
    val inputPath = args.headOption.getOrElse(DefaultInputPath)
    val spark = SparkSession.builder().master("local[4]").appName("score").getOrCreate()

    // Close the session even if reading or parsing fails, so it is never leaked.
    try {
      import spark.implicits._

      val rows = spark.sparkContext
        .textFile(inputPath)
        .filter(_.trim.nonEmpty) // tolerate blank lines (e.g. a trailing newline)
        .map(parseLine)

      val df = spark.createDataFrame(rows, PersonSchema)
      df.show()
      df.selectExpr("id", "score").where($"score" > 80).show()
    } finally {
      spark.close()
    }
  }

  /** Converts one `name,id,score` line into a [[Row]] matching [[PersonSchema]].
    *
    * Fields beyond the third are ignored. Whitespace around the two numeric
    * fields is trimmed before conversion; the name is kept exactly as written.
    *
    * @param line a single non-blank line of the input file
    * @return a row of (name, id, score)
    * @throws IllegalArgumentException if the line has fewer than three fields
    * @throws NumberFormatException    if id or score is not a valid integer
    */
  private def parseLine(line: String): Row =
    line.split(",") match {
      case Array(name, id, score, _*) =>
        Row(name, id.trim.toInt, score.trim.toInt)
      case fields =>
        throw new IllegalArgumentException(
          s"Expected at least 3 comma-separated fields (name,id,score) but found ${fields.length}: '$line'"
        )
    }
}
数据（person.txt，每行格式：name,id,score）
zhangsan,13,100
lisi,12,80
zhanghua,1,90
weige,3,79
结果