-- Load the local path /home/hadoop/work into the docs table.
-- "local" reads from the client file system rather than HDFS, and
-- "overwrite" replaces whatever the table currently contains.
load data local inpath "/home/hadoop/work" overwrite into table docs;
创建wordcount表:通过子查询将每行文本拆分为单词,再按单词分组统计词频并排序
-- Build the wordcount table with a CTAS statement.
-- The subquery splits each line of docs on a whitespace character and uses
-- explode() to emit one row per token. The outer query then counts the
-- occurrences of each word and sorts the result by word.
create table wordcount as
select
    word,
    count(1) as num
from (
    select explode(split(line, '\\s')) as word
    from docs
) x
group by word
order by word;
查询新表wordcount以验证结果,每行的输出格式为:单词 频数
-- Show every row of wordcount: the word followed by its count.
select
    word,
    num
from wordcount;
3. 通过脚本实现hql语句
在Linux下编写扩展名为.hql的脚本文件wordcount.hql,写入以下HQL语句:
-- wordcount.hql: rebuild the word-frequency table and print it.
use mydb;

-- Drop any previous result so the script can be rerun. Without this the
-- CTAS below fails when wordcount already exists in mydb.
drop table if exists wordcount;

-- Split each line of docs on a whitespace character, emit one row per token
-- with explode(), then count the occurrences of each word, sorted by word.
create table wordcount as
select
    word,
    count(1) as num
from (
    select explode(split(line, '\\s')) as word
    from docs
) x
group by word
order by word;

-- Print the result: one row per word with its count.
select * from wordcount;