// Day-of-week lookup built on java.text.SimpleDateFormat.
// Takes a date string in "yyyy-MM-dd" form and returns the day number of the
// week as a string, "1" (Monday) through "7" (Sunday), as produced by the
// "u" pattern letter. Parsing throws java.text.ParseException when the start
// of the string is not a valid date.
def getDayOfWeek: String => String = { date =>
  // A fresh formatter is built on every call, exactly as before.
  val parsedDate = new SimpleDateFormat("yyyy-MM-dd").parse(date)
  new SimpleDateFormat("u").format(parsedDate)
}
// Chinese weekday names, indexed with Sunday at 0 through Saturday at 6.
val weekDays: Array[String] = Array(
  "星期日", // Sunday
  "星期一", // Monday
  "星期二", // Tuesday
  "星期三", // Wednesday
  "星期四", // Thursday
  "星期五", // Friday
  "星期六"  // Saturday
)
// Register the SQL function get_weekday(date): maps a "yyyy-MM-dd" date string
// to its Chinese weekday name through the weekDays lookup table.
spark.udf.register("get_weekday", (date: String) => {
  // getDayOfWeek yields "1" (Monday) .. "7" (Sunday), while weekDays is indexed
  // from Sunday = 0; taking the value modulo 7 folds Sunday's 7 onto index 0
  // and leaves 1..6 untouched.
  val dayIndex = getDayOfWeek(date).toInt % 7
  weekDays(dayIndex)
})
// Register the SQL function get_day_week(date): maps a "yyyy-MM-dd" date string
// to a day-of-week number with Sunday = 0 and Monday..Saturday = 1..6.
spark.udf.register("get_day_week", (date: String) => {
  // getDayOfWeek yields "1" (Monday) .. "7" (Sunday); taking the value modulo 7
  // turns Sunday's 7 into 0 and leaves 1..6 untouched.
  getDayOfWeek(date).toInt % 7
})
// Combine the two per-day, per-shop aggregates (visit counts and customer
// payment counts) into a single DataFrame.
val trainPrerDayUserDF = {
  // Rows are matched on the shared date_str and shop_id columns.
  val visitsAndPays = trainPerDayUserVisitCountDF.join(trainPryDayUserPayCountDf, Seq("date_str", "shop_id"))
  // For the feature values, what is needed is the day of the week (e.g. Monday).
  visitsAndPays.selectExpr(
    "get_weekday(date_str) as weekday", // convert the date to a weekday name
    "get_day_week(date_str) as day_week", // which day of the week it is, as a number
    "shop_id",
    "count_visit",
    "count_pay"
  )
}