Spark之UDAF

 1 import org.apache.spark.sql.{Row, SparkSession}
 2 import org.apache.spark.sql.expressions.{MutableAggregationBuffer, UserDefinedAggregateFunction}
 3 import org.apache.spark.sql.types._
 4 
 /**
   * Spark SQL user-defined aggregate function that averages a `LongType` column.
   *
   * The aggregation buffer keeps a running `sum` and a `count` of the non-null inputs.
   * The result is `sum / count` as a `DoubleType` value, or SQL NULL when no non-null
   * input was aggregated (empty input or an all-null column).
   *
   * NOTE: the running sum is a `Long`; it wraps silently if the total exceeds the
   * `Long` range.
   *
   * Created by zhen on 2018/11/26.
   */
 object AverageUserDefinedAggregateFunction extends UserDefinedAggregateFunction {

   /** Schema of the function's arguments: a single `LongType` column. */
   override def inputSchema: StructType = StructType(StructField("input", LongType) :: Nil)

   /** Schema of the intermediate buffer: slot 0 is the running sum, slot 1 the row count. */
   override def bufferSchema: StructType =
     StructType(StructField("sum", LongType) :: StructField("count", LongType) :: Nil)

   /** Type of the final result. */
   override def dataType: DataType = DoubleType

   /** The same input always yields the same output. */
   override def deterministic: Boolean = true

   /** Resets the buffer to the empty aggregate: sum = 0, count = 0. */
   override def initialize(buffer: MutableAggregationBuffer): Unit = {
     buffer(0) = 0L
     buffer(1) = 0L
   }

   /**
     * Folds one input row into the buffer.
     *
     * Null inputs are skipped, so they contribute to neither the sum nor the count.
     */
   override def update(buffer: MutableAggregationBuffer, input: Row): Unit = {
     if (!input.isNullAt(0)) {
       buffer(0) = buffer.getLong(0) + input.getLong(0) // running sum
       buffer(1) = buffer.getLong(1) + 1L               // number of non-null inputs
     }
   }

   /** Merges the partial aggregate `bufferRight` into `bufferLeft`. */
   override def merge(bufferLeft: MutableAggregationBuffer, bufferRight: Row): Unit = {
     bufferLeft(0) = bufferLeft.getLong(0) + bufferRight.getLong(0)
     bufferLeft(1) = bufferLeft.getLong(1) + bufferRight.getLong(1)
   }

   /**
     * Produces the final average from the buffer.
     *
     * @return `sum / count` as a `Double`, or `null` (SQL NULL) when `count` is zero;
     *         without this guard the division would yield `NaN`.
     */
   override def evaluate(buffer: Row): Any = {
     val count = buffer.getLong(1)
     if (count == 0L) null else buffer.getLong(0).toDouble / count
   }
 }
/**
  * Demo driver: loads a JSON file as the temp view `user`, registers
  * `AverageUserDefinedAggregateFunction` under the SQL name `average`, and prints the
  * row count together with the average of the `age` column.
  */
object SparkUdaf {

  /** Input file used when no path is given on the command line. */
  private val DefaultInputPath = "E:/BDS/newsparkml/src/udaf.json"

  /**
    * Program entry point.
    *
    * @param args optional; `args(0)` overrides the path of the JSON input file
    */
  def main(args: Array[String]): Unit = {
    val inputPath = args.headOption.getOrElse(DefaultInputPath)

    val spark = SparkSession
      .builder()
      .appName("udaf")
      .master("local[2]")
      .getOrCreate()

    // Stop the session even if reading the file or running the query fails.
    try {
      spark.read.json(inputPath).createOrReplaceTempView("user")
      spark.udf.register("average", AverageUserDefinedAggregateFunction)
      spark.sql("select count(*) count,average(age) avg_age from user").show()
    } finally {
      spark.stop()
    }
  }
}

结果:

 

转载于:https://www.cnblogs.com/yszd/p/10021864.html

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值