Spark DataFrame Hello World

package com.astron.spark2

import org.apache.spark
import org.apache.spark.sql.SparkSession

/**
  * Minimal Spark DataFrame walkthrough: loads an employee JSON file and prints
  * the result of several `filter` calls (SQL-string predicates, `Column`
  * equality / inequality, and the `$"col"` interpolator).
  */
object BasicOperation {

  /**
    * Entry point. Builds a `SparkSession` with master `local`, runs the filter
    * demonstrations, and always stops the session afterwards.
    *
    * @param args command-line arguments (not used)
    */
  def main(args: Array[String]): Unit = {
    println("astron")
    val spark = SparkSession
      .builder()
      .master("local")
      .appName("star")
      .getOrCreate()

    // Stop the session even if a read or a filter throws, so the Spark
    // context and its resources are released.
    try {
      // Bring Spark's implicit conversions into scope (needed for the $"..." syntax).
      import spark.implicits._

      // Separator prefix shared by every section header.
      val rule = "-" * 10

      val emp = spark.read.json("d://employee.json")

      println(rule + "完整数据")
      emp.show()

      // Numeric filtering using SQL expression strings.
      println(rule + "数值型过滤emp.filter(\"age>40\").filter(\"salary>1000\").show()")
      emp.filter("age>40").filter("salary>1000").show()

      // String filtering: equality on a Column.
      println(rule + "字符型过滤:等于emp.filter(emp(\"name\")===\"Jen\").show()")
      emp.filter(emp("name") === "Jen").show()

      // String filtering: inequality via the deprecated `!==` operator.
      // Kept on purpose to contrast with `=!=` below; it emits a deprecation warning.
      println(rule + "字符型过滤:不等于,已经过期用法emp.filter(emp(\"name\")!==\"Jen\").show()")
      emp.filter(emp("name") !== "Jen").show()

      // String filtering: inequality via the current `=!=` operator.
      println(rule + "字符型过滤:不等于,目前用法emp.filter(emp(\"name\")=!=\"Jen\").show()")
      emp.filter(emp("name") =!= "Jen").show()

      // Column access through the $ interpolator. `=!=` and `===` both bind
      // tighter than `&&`, so this is (name =!= "Jen") && (age === 25).
      emp.filter($"name" =!= "Jen" && $"age" === 25).show()
    } finally {
      spark.stop()
    }
  }

}
astron
----------完整数据
+---+-----+------+------+------+
|age|depId|gender|  name|salary|
+---+-----+------+------+------+
| 25|    1|  male|   Leo| 20000|
| 30|    2|female| Marry| 25000|
| 35|    1|  male|  Jack| 15000|
| 42|    3|  male|   Tom| 18000|
| 21|    3|female|Kattie| 21000|
| 30|    2|female|   Jen| 28000|
| 19|    2|female|   Jen|  8000|
+---+-----+------+------+------+

----------数值型过滤emp.filter("age>40").filter("salary>1000").show()
+---+-----+------+----+------+
|age|depId|gender|name|salary|
+---+-----+------+----+------+
| 42|    3|  male| Tom| 18000|
+---+-----+------+----+------+

----------字符型过滤:等于emp.filter(emp("name")==="Jen").show()
+---+-----+------+----+------+
|age|depId|gender|name|salary|
+---+-----+------+----+------+
| 30|    2|female| Jen| 28000|
| 19|    2|female| Jen|  8000|
+---+-----+------+----+------+

----------字符型过滤:不等于,已经过期用法emp.filter(emp("name")!=="Jen").show()
+---+-----+------+------+------+
|age|depId|gender|  name|salary|
+---+-----+------+------+------+
| 25|    1|  male|   Leo| 20000|
| 30|    2|female| Marry| 25000|
| 35|    1|  male|  Jack| 15000|
| 42|    3|  male|   Tom| 18000|
| 21|    3|female|Kattie| 21000|
+---+-----+------+------+------+

----------字符型过滤:不等于,目前用法emp.filter(emp("name")=!="Jen").show()
+---+-----+------+------+------+
|age|depId|gender|  name|salary|
+---+-----+------+------+------+
| 25|    1|  male|   Leo| 20000|
| 30|    2|female| Marry| 25000|
| 35|    1|  male|  Jack| 15000|
| 42|    3|  male|   Tom| 18000|
| 21|    3|female|Kattie| 21000|
+---+-----+------+------+------+

+---+-----+------+----+------+
|age|depId|gender|name|salary|
+---+-----+------+----+------+
| 25|    1|  male| Leo| 20000|
+---+-----+------+----+------+
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值