// aggregateByKey
import org.apache.spark.{SparkConf, SparkContext}
/**
 * Small demonstration of `aggregateByKey` on a pair RDD.
 *
 * Within each partition the values of a key are folded with `math.max`,
 * starting from the zero value 0; the per-partition results for the same
 * key are then combined with `+`.
 */
object AggegateByKeyTest {

  /**
   * Creates a local SparkContext, runs the aggregation over a fixed sample
   * data set distributed across 3 partitions, and prints every resulting
   * (key, value) pair.
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    val conf = new SparkConf().setMaster("local").setAppName("ArregateByKey")
    val sc = new SparkContext(conf)
    try {
      val data = List((1, 3), (1, 4), (2, 3), (3, 6), (1, 2), (3, 8))
      val rdd = sc.parallelize(data, 3)
      // Because the zero value is 0, a per-partition maximum is never below 0.
      rdd.aggregateByKey(0)(math.max(_, _), _ + _).collect().foreach(println)
    } finally {
      // Always release the context, even when the job above throws.
      sc.stop()
    }
  }
}