String 转 RDD[String] 并取出出现次数排名靠前的 key

import com.sun.rowset.internal.Row
import org.apache.spark.storage.StorageLevel
import org.jruby.ext.ffi.StructLayout.Storage
import scala.collection.mutable.{ArrayBuffer, ListBuffer}
//import org.apache.hadoop.hive.serde2.objectinspector.StructField
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.{DataFrame, Dataset, SparkSession}
import org.apache.spark.sql.types.{StructField, StructType}
import org.dmg.pmml.True

/*!/usr/bin/env java
# -*- coding:utf-8 -*-
# Author: supeihuang
 Time: 2019/4/19 15:59*/

  /**
    * Demo: splits a comma-separated string, counts the tokens with a Spark RDD,
    * and picks the most frequent token, skipping "-1" when another token exists.
    */
  object test {
    // Local-mode session used by sortedTopOne; main stops it once the demo has run.
    val spark: SparkSession = SparkSession.builder().master("local").getOrCreate()

    /**
      * Returns the most frequent comma-separated token in `data`, preferring any
      * token other than "-1".
      *
      * Prints the raw input and the ranked key list as a side effect.
      *
      * @param data comma-separated tokens
      * @return the highest-count token that is not "-1"; "-1" itself when it is the
      *         only token present
      * @throws IllegalArgumentException when `data` yields no tokens at all
      *                                  (e.g. "," — String.split drops trailing empty strings)
      */
    def sortedTopOne(data: String): String = {
      println(data)
      val tokenPairs = data.split(",").map(token => (token, 1))
      val counts = spark.sparkContext.parallelize(tokenPairs).reduceByKey(_ + _)
      // Ranked by count only, descending; the order among equal counts is not pinned down here.
      val ranked = counts.sortBy(_._2, ascending = false).keys.collect().toList
      println("---" + ranked)
      // Keys are distinct after reduceByKey, so the first non-"-1" key is either the
      // top key or the runner-up behind "-1". Fall back to "-1" when nothing else exists
      // instead of indexing past the end of the list.
      ranked
        .find(_ != "-1")
        .orElse(ranked.headOption)
        .getOrElse(throw new IllegalArgumentException(s"no keys found in input: '$data'"))
    }

    /** Runs the demo on a fixed sample string and prints the winning key. */
    def main(args: Array[String]): Unit = {
      val list = "332684,60070,306590,57608,-1,60070,60070,-1,302720,60070,-1,120537,63672,60848,99634,60070,60070,60795,56737,60070,41737,57085,304525,120516,-1,-1,-1,60070,-1,-1,-1,-1,-1,-1,-1,-1,-1,63673,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1"
      try {
        val result = sortedTopOne(list)
        println("xxx" + result)
      } finally {
        // Release the local Spark resources even if the job fails.
        spark.stop()
      }
    }
  }


  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值