step0:建表语句(hive脚本)
-- Creates the table that receives the forecast output: plain-text storage,
-- tab-separated fields, one partition per load date (column d).
USE databasename;

-- IF NOT EXISTS keeps this step re-runnable: a second execution is a no-op
-- instead of failing because the table already exists.
CREATE TABLE IF NOT EXISTS OrderQuantity_Forecast_Table (
    masterhotel INT    COMMENT '酒店ID',       -- hotel id
    orderdate   STRING COMMENT '订单日期',     -- order date, stored as text
    city        INT    COMMENT '城市ID',       -- city id
    y_bar       DOUBLE COMMENT '产量预测值'    -- forecast value
)
COMMENT '订单间夜量预测结果输出表'
PARTITIONED BY (d STRING COMMENT '日期分区')
-- The '\t' delimiter must match the separator used when the data file is written.
ROW FORMAT DELIMITED FIELDS TERMINATED BY '\t'
STORED AS TEXTFILE;
step1:样例数据生成(python脚本)
# Write the frame as a tab-separated text file with no header row and no
# index column, so each line holds only the data fields.
output_values.to_csv(
    "output_values.txt",
    sep='\t',
    header=False,
    index=False,
)
step2:导入hive方式
## Hive-Shell形式
-- Run inside the Hive CLI: copies the local file into the 2016-10-31 partition.
-- INTO (without OVERWRITE) appends, so repeating the statement loads the rows again.
LOAD DATA LOCAL INPATH 'output_values.txt'
INTO TABLE databasename.OrderQuantity_Forecast_Table
PARTITION (d = '2016-10-31');
# Run from a Linux shell: -S is silent mode, -e executes the quoted statement.
# The statement must be closed with a matching double quote, otherwise the
# shell keeps waiting for more input instead of launching hive.
hive -S -e "load data local inpath 'output_values.txt' into table databasename.OrderQuantity_Forecast_Table partition(d='2016-10-31');"
## Python形式
import subprocess

# LOAD statement for the 2016-10-31 partition; OVERWRITE replaces whatever
# the partition already contains.
sql = """load data local inpath "output_values.txt" overwrite into table databasename.OrderQuantity_Forecast_Table partition(d="2016-10-31");"""

# The assignment and the call must be separate statements.
# Passing an argument list (no shell) means the double quotes inside the
# statement need no escaping. check_call waits for hive to exit and raises
# CalledProcessError on a non-zero exit status, so a failed load is noticed.
subprocess.check_call(["hive", "-S", "-e", sql])
step3:数据检查
##检查数据是否存在
-- Spot-check: fetch at most 100 rows from the 2016-10-31 partition to confirm
-- that the load produced data.
SELECT *
FROM databasename.OrderQuantity_Forecast_Table
WHERE d = '2016-10-31'
LIMIT 100;
##删除分区
-- Removes the 2016-10-31 partition from the forecast table.
-- NOTE(review): for a managed (non-EXTERNAL) table this presumably removes the
-- partition's data files as well as its metadata; confirm before running.
USE databasename;
ALTER TABLE OrderQuantity_Forecast_Table
    DROP PARTITION (d = '2016-10-31');
##显示分区
-- Lists every partition currently registered for the forecast table.
SHOW PARTITIONS databasename.OrderQuantity_Forecast_Table;
step4:Linux环境下python后台运行
命令:nohup python yourscript.py &  —— 让程序在后台运行(退出终端后仍会继续执行),控制台输出默认写入当前目录下的 nohup.out 文件