向 Hive 动态分区表写入数据时,可能会遇到一些问题(例如动态分区模式受限、作业创建的文件数超过上限),同时我们还希望主动指定输出的压缩格式,对应的 demo SQL 如下:
-- Demo: load one day of rows from vvv.v3 into the dynamically partitioned
-- table xxx.user_action_pack_info, writing LZO-compressed output.
--
-- Inputs
--   ${yesterday}  partition date, expected to be substituted by the caller
--                 (scheduler template or Hive variable substitution)
--   xxx.actions   read for partition p_date = ${yesterday}, only userid is used
--   vvv.v3        read for partition ptdate = ${yesterday}
-- Output
--   xxx.user_action_pack_info, dynamic partition column date_user_tail with
--   values of the form <yesterday>-<member_id % 100>
--
-- Comments are kept on their own lines starting at column 0 and contain no
-- statement terminators, so that older Hive CLI versions skip them cleanly.

-- Allow partition values to be taken from the query result.
set hive.exec.dynamic.partition=true;
-- The insert below has no static partition column, which strict mode rejects.
set hive.exec.dynamic.partition.mode=nonstrict;
-- Raise the cap on the number of files one job may create. Every writer task
-- can open a file in every partition it sees, so the count grows quickly.
set hive.exec.max.created.files=200000;
-- Compress the final job output with the LZOP codec.
-- NOTE(review): the codec class comes from the hadoop-lzo library, which must
-- be installed on the cluster. Confirm before running elsewhere.
set hive.exec.compress.output=true;
set mapred.output.compression.codec=com.hadoop.compression.lzo.LzopCodec;

-- action_users is deduplicated with group by, so the inner join only filters
-- v3 rows to members that appear in xxx.actions and never multiplies rows.
-- The last select column feeds the dynamic partition column (matched by
-- position, not by name).
-- NOTE(review): member_id % 100 assumes member_id is a non-negative integer.
-- A negative or non-integer value would produce unexpected partition names.
insert overwrite table xxx.user_action_pack_info
partition (date_user_tail)
select
    v3.time      as time,
    v3.member_id as member_id,
    v3.method    as method,
    v3.url       as url,
    v3.ip        as ip,
    v3.referer   as refer,
    concat("${yesterday}", '-', v3.member_id % 100) as date_user_tail
from (
    select userid
    from xxx.actions
    where p_date = "${yesterday}"
    group by userid
) as action_users
inner join (
    select time, method, url, ip, member_id, referer
    from vvv.v3
    where ptdate = "${yesterday}"
) as v3
    on action_users.userid = v3.member_id;