Hive 操作与应用词频统计

本地文件

启动hive

#查看数据库
show databases;

show databases

#创建数据库
create database if not exists hive;

create database

#查看是否成功创建数据库
show databases;

查看是否成功创建数据库

#查看表
use hive;
show tables;

show tables

#创建表
create table if not exists pctext(line string);

create table

#查看是否成功创建表
show tables;

show tables

#映射本地文件的数据到文本表中
load data local inpath '/home/hadoop/HLH/hlh1.txt' into table pctext;

load data

#查看映射内容
select * from pctext;

select *

#词频统计
-- Preview: each line split on single spaces, returned as one array of words per row.
select split(line,' ') as word from pctext;
-- Preview: explode() flattens each array into one output row per word.
select explode(split(line,' ')) as word from pctext;

select split
select explode

#查看统计结果
-- Word frequency: split every line on single spaces, explode the arrays into
-- one row per word, then count the rows for each distinct word.
select word, count(1) as count
from (select explode(split(line,' ')) as word from pctext) w
group by word
order by word;

#上传本地文件
hdfs dfs -put HLH HLH
#查看上传结果
hdfs dfs -ls HLH

hdfs dfs -put

#创建数据表
-- Single-column text table; the trailing semicolon ends the statement so the
-- lines that follow are not parsed as part of it.
create table if not exists HLH(line string);
#查看数据表是否创建成功
show tables;

create table

Hive 操作与应用 词频统计