hive-1

 
 
## Generates the mpi-web report from the backend nginx logs.
USE bi;
## Commented-out variable definition, kept for reference:
##set ($suffix = "${env.YYYY}${env.MM}${env.DD}");
## Create the staging table for today's aggregates.
## The table is dropped first, so each run starts from an empty table.
## NOTE(review): the delimiter clauses are presumably ignored for ORC storage; confirm before removing them.
DROP TABLE IF EXISTS dpstg_mpi_nginx_log_today_${env.YYYY}${env.MM}${env.DD};
CREATE TABLE IF NOT EXISTS dpstg_mpi_nginx_log_today_${env.YYYY}${env.MM}${env.DD}
(
    server_ip             STRING,
    url                   STRING,
    times                 INT,
    avg_response_today    INT,
    avg_body_size         INT,
    response_line95_today INT,
    count_50x             INT,
    count_40x             INT,
    count_30x             INT,
    count_20x             INT
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\005'
    COLLECTION ITEMS TERMINATED BY '\002'
    MAP KEYS TERMINATED BY '\003'
    LINES TERMINATED BY '\n'
STORED AS ORC;
## Create the staging table for yesterday's aggregates.
## Its columns mirror the today staging table, including the *_today column names.
## NOTE(review): the delimiter clauses are presumably ignored for ORC storage; confirm before removing them.
DROP TABLE IF EXISTS dpstg_mpi_nginx_log_yesterday_${env.YYYY}${env.MM}${env.DD};
CREATE TABLE IF NOT EXISTS dpstg_mpi_nginx_log_yesterday_${env.YYYY}${env.MM}${env.DD}
(
    server_ip             STRING,
    url                   STRING,
    times                 INT,
    avg_response_today    INT,
    avg_body_size         INT,
    response_line95_today INT,
    count_50x             INT,
    count_40x             INT,
    count_30x             INT,
    count_20x             INT
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\005'
    COLLECTION ITEMS TERMINATED BY '\002'
    MAP KEYS TERMINATED BY '\003'
    LINES TERMINATED BY '\n'
STORED AS ORC;
## Build today's aggregates: one row per (normalized url, server_ip) for application 'mpi-web'.
## The url key is the URL host concatenated with the URL path after the regex below has been applied.
## NOTE(review): inside the character class the '|' is a literal, so pipes are stripped along with
## digits, '+' and '*'; confirm that is intended. The pattern is kept unchanged so that the today and
## yesterday keys stay comparable.
## Requests for /index.jsp and /heartbeat.html, and hosts 'dp' and 'www.dianping.com', are excluded.
## Metrics:
##   times                 - count of non-null url values in the group
##   avg_response_today    - rounded avg(response_time) * 1000 (presumably seconds to milliseconds; confirm)
##   avg_body_size         - rounded avg(body_bytes_sent)
##   response_line95_today - exact 95th percentile of round(response_time * 1000)
##   count_NNx             - number of rows whose status starts with 50 / 40 / 30 / 20
## The percentile input is cast to BIGINT because Hive's exact percentile does not accept
## floating-point input; the value is already rounded, so the cast does not change it.
## There is no ORDER BY: the only reader of this staging table is a join, so row order carries no
## meaning, and a global sort would funnel the whole result through a single reducer.
INSERT INTO TABLE dpstg_mpi_nginx_log_today_${env.YYYY}${env.MM}${env.DD}
SELECT
    server_ip,
    concat(parse_url(url, 'HOST'), regexp_replace(parse_url(url, 'PATH'), '[0-9|\+|\*]', '')) AS url_s,
    count(url) AS times,
    round(avg(response_time) * 1000) AS avg_response_today,
    round(avg(body_bytes_sent)) AS avg_body_size,
    round(percentile(CAST(round(response_time * 1000) AS BIGINT), 0.95)) AS response_line95_today,
    sum(CASE WHEN status LIKE '50%' THEN 1 ELSE 0 END) AS count_50x,
    sum(CASE WHEN status LIKE '40%' THEN 1 ELSE 0 END) AS count_40x,
    sum(CASE WHEN status LIKE '30%' THEN 1 ELSE 0 END) AS count_30x,
    sum(CASE WHEN status LIKE '20%' THEN 1 ELSE 0 END) AS count_20x
FROM dpdw_nginx_log_all
WHERE application = 'mpi-web'
    AND hp_stat_date = '${env.YYYYMMDD}'
    AND parse_url(url, 'PATH') <> '/index.jsp'
    AND parse_url(url, 'PATH') <> '/heartbeat.html'
    AND parse_url(url, 'HOST') <> 'dp'
    AND parse_url(url, 'HOST') <> 'www.dianping.com'
GROUP BY
    concat(parse_url(url, 'HOST'), regexp_replace(parse_url(url, 'PATH'), '[0-9|\+|\*]', '')),
    server_ip,
    application
;
## Build yesterday's aggregates: one row per (normalized url, server_ip) for application 'mpi-web',
## read from the partition selected by the YYYYMMDD_P1D placeholder.
## The url key is the URL host concatenated with the URL path after the regex below has been applied.
## NOTE(review): inside the character class the '|' is a literal, so pipes are stripped along with
## digits, '+' and '*'; confirm that is intended. The pattern is kept unchanged so that the today and
## yesterday keys stay comparable.
## Requests for /index.jsp and /heartbeat.html, and hosts 'dp' and 'www.dianping.com', are excluded.
## Metric columns keep the *_today names because the staging table is declared with those names.
## The percentile input is cast to BIGINT because Hive's exact percentile does not accept
## floating-point input; the value is already rounded, so the cast does not change it.
## There is no ORDER BY: the only reader of this staging table is a join, so row order carries no
## meaning, and a global sort would funnel the whole result through a single reducer.
INSERT INTO TABLE dpstg_mpi_nginx_log_yesterday_${env.YYYY}${env.MM}${env.DD}
SELECT
    server_ip AS server_ip,
    concat(parse_url(url, 'HOST'), regexp_replace(parse_url(url, 'PATH'), '[0-9|\+|\*]', '')) AS url,
    count(url) AS times,
    round(avg(response_time) * 1000) AS avg_response_today,
    round(avg(body_bytes_sent)) AS avg_body_size,
    round(percentile(CAST(round(response_time * 1000) AS BIGINT), 0.95)) AS response_line95_today,
    sum(CASE WHEN status LIKE '50%' THEN 1 ELSE 0 END) AS count_50x,
    sum(CASE WHEN status LIKE '40%' THEN 1 ELSE 0 END) AS count_40x,
    sum(CASE WHEN status LIKE '30%' THEN 1 ELSE 0 END) AS count_30x,
    sum(CASE WHEN status LIKE '20%' THEN 1 ELSE 0 END) AS count_20x
FROM dpdw_nginx_log_all
WHERE application = 'mpi-web'
    AND hp_stat_date = '${env.YYYYMMDD_P1D}'
    AND parse_url(url, 'PATH') <> '/index.jsp'
    AND parse_url(url, 'PATH') <> '/heartbeat.html'
    AND parse_url(url, 'HOST') <> 'dp'
    AND parse_url(url, 'HOST') <> 'www.dianping.com'
GROUP BY
    concat(parse_url(url, 'HOST'), regexp_replace(parse_url(url, 'PATH'), '[0-9|\+|\*]', '')),
    server_ip,
    application
;
## Publish the daily report partition: every row of the today staging table, paired with the
## yesterday row that has the same url and server_ip. The *_cmp columns carry yesterday's values
## and fall back to 0 when there is no matching yesterday row. Column order matters because the
## insert maps select columns to the target table by position.
INSERT OVERWRITE TABLE dprpt_mpi_nginx_log_daily PARTITION (hp_cal_dt = '${env.YYYYMMDD}')
SELECT
    td.server_ip                          AS server_ip,
    td.url                                AS url,
    td.times                              AS times,
    COALESCE(yd.times, 0)                 AS times_cmp,
    td.avg_response_today                 AS avg_response_today,
    COALESCE(yd.avg_response_today, 0)    AS avg_response_cmp,
    td.response_line95_today              AS response_line95_today,
    COALESCE(yd.response_line95_today, 0) AS response_line95_today_cmp,
    td.avg_body_size                      AS avg_body_size,
    td.count_20x                          AS count_20x,
    COALESCE(yd.count_20x, 0)             AS count_20x_cmp,
    td.count_30x                          AS count_30x,
    COALESCE(yd.count_30x, 0)             AS count_30x_cmp,
    td.count_40x                          AS count_40x,
    COALESCE(yd.count_40x, 0)             AS count_40x_cmp,
    td.count_50x                          AS count_50x,
    COALESCE(yd.count_50x, 0)             AS count_50x_cmp
FROM dpstg_mpi_nginx_log_today_${env.YYYY}${env.MM}${env.DD} td
LEFT OUTER JOIN dpstg_mpi_nginx_log_yesterday_${env.YYYY}${env.MM}${env.DD} yd
    ON td.url = yd.url
    AND td.server_ip = yd.server_ip
ORDER BY times DESC;
## Clean up: remove both per-run staging tables.
DROP TABLE IF EXISTS dpstg_mpi_nginx_log_today_${env.YYYY}${env.MM}${env.DD};
DROP TABLE IF EXISTS dpstg_mpi_nginx_log_yesterday_${env.YYYY}${env.MM}${env.DD};
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值