第一关:Hive存储数据
根据要求配置环境
# Run the cluster start-up script (presumably Hadoop's start-all.sh - confirm on this image).
start-all.sh
# Initialise the Hive metastore schema, declaring MySQL as the backing database type.
schematool -dbType mysql -initSchema
初始化成功后,执行hive命令进入Hive命令行
在hive中创建数据库trafficdata
-- Create the trafficdata database. The if-not-exists guard lets this step be
-- re-run without failing when the database is already present.
create database if not exists trafficdata;
在trafficdata中创建表
-- Make trafficdata the current database so both tables are created inside it.
use trafficdata;
-- Table that receives canceldata.txt. Every column is kept as a raw string.
-- The if-not-exists guard makes the statement safe to re-run.
-- NOTE(review): fields here are split on the pipe character, while createorder
-- below is split on tabs - confirm each delimiter against its data file.
create table if not exists cancelorder (
    companyid      string,
    address        string,
    districtname   string,
    orderid        string,
    ordertime      string,
    canceltime     string,
    operator       string,
    canceltypecode string,
    cancelreason   string
)
row format delimited
fields terminated by '|'
stored as textfile;
-- Table that receives createdata.txt. Every column is kept as a raw string,
-- including the time and longitude/latitude fields.
create table if not exists createorder (
    companyid     string,
    address       string,
    districtname  string,
    orderid       string,
    departtime    string,
    ordertime     string,
    departure     string,
    deplongitude  string,
    deplatitude   string,
    destination   string,
    destlongitude string,
    destlatitude  string
)
row format delimited
fields terminated by '\t'
stored as textfile;
两个表创建完成后,另开一个新的命令行窗口(不要退出hive),进入canceldata.txt和createdata.txt所在目录
# Switch to the local directory that holds canceldata.txt and createdata.txt.
cd /data/workspace/myshixun/data/
执行hdfs的put命令,把数据上传到hdfs上的/user/目录中
# Upload both data files from the current local directory to /user/ on HDFS.
# -f overwrites a copy left behind by an earlier attempt, so re-running this
# step does not abort with a "File exists" error.
hdfs dfs -put -f canceldata.txt /user/
hdfs dfs -put -f createdata.txt /user/
返回到hive中,执行数据加载,导入数据到表中
-- Load the uploaded files into their tables. Table names are qualified with the
-- database so the statements work whichever database is current in the session.
-- Without the local keyword, load data inpath moves the HDFS file into the table
-- location, so the files must be uploaded to /user/ again before reloading.
load data inpath '/user/canceldata.txt' into table trafficdata.cancelorder;
load data inpath '/user/createdata.txt' into table trafficdata.createorder;