Skip to content

GitLab

  • Projects
  • Groups
  • Snippets
  • Help
    • Loading...
  • Help
    • Help
    • Support
    • Community forum
    • Submit feedback
    • Contribute to GitLab
  • Sign in / Register
W
wiki-hadoop
  • Project overview
    • Project overview
    • Details
    • Activity
  • Issues 0
    • Issues 0
    • List
    • Boards
    • Labels
    • Service Desk
    • Milestones
  • Merge requests 0
    • Merge requests 0
  • Operations
    • Operations
    • Incidents
  • Analytics
    • Analytics
    • Value Stream
  • Wiki
    • Wiki
  • Members
    • Members
  • Activity
  • Create a new issue
  • Issue Boards
Collapse sidebar
  • 老徐
  • wiki-hadoop
  • Wiki
  • Hive_Table_Operation

Hive_Table_Operation · Changes

Page history
yangbl created page: Hive_Table_Operation authored Sep 08, 2015 by 杨宝龙's avatar 杨宝龙
Hide whitespace changes
Inline Side-by-side
Showing with 100 additions and 0 deletions
+100 -0
  • Hive_Table_Operation.md Hive_Table_Operation.md +100 -0
  • No files found.
Hive_Table_Operation.md 0 → 100644
View page @ c7ff871e
# 基本表操作
## 查看数据表详情
-- Show the details of table touna.
DESCRIBE touna;
-- Same table, using the FORMATTED form of the command.
DESCRIBE FORMATTED touna;
## 更改表的列名
-- Rename column host of laoniushuju_pv to domain; the declared type stays STRING.
ALTER TABLE laoniushuju_pv
    CHANGE COLUMN host domain STRING;
## 清空数据表(慎用!)
-- Empty ua_chinese by overwriting it with a query that selects no rows
-- (the predicate 1 = 0 never holds). Destructive: use with care.
-- NOTE(review): for a managed table, TRUNCATE TABLE may be a simpler option - confirm
-- against the Hive version in use.
INSERT OVERWRITE TABLE ua_chinese
SELECT *
FROM ua_chinese
WHERE 1 = 0;
## 删除表(慎用!)
-- Drop table pingan_data_pv_20150504. Destructive: double-check the name before running.
DROP TABLE pingan_data_pv_20150504;
# 内部表
## 创建内部表
-- Create the managed (internal) table kw_test for tab-separated text data.
-- IF NOT EXISTS keeps the statement re-runnable, matching the other CREATE
-- statements on this page. STORED AS TEXTFILE pins the file format instead of
-- relying on the session default (hive.default.fileformat), because the load
-- example for this table ingests a gzip-compressed text file.
CREATE TABLE IF NOT EXISTS kw_test (
    srcip     STRING,
    ad        STRING,
    ts        STRING,
    url       STRING,
    ref       STRING,
    ua        STRING,
    dstip     STRING,
    cookie    STRING,
    datelabel STRING,
    loadstamp STRING
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
STORED AS TEXTFILE;
## 导入数据到内部表
-- With LOCAL: the source path is on the local filesystem.
LOAD DATA LOCAL INPATH '/home/yangbl/data/task'
    INTO TABLE ua_chinese;
-- Without LOCAL: the source path is on HDFS; the target table is qualified with its database.
-- NOTE(review): Hive is documented to move (not copy) HDFS source files - confirm before relying on the source path afterwards.
LOAD DATA INPATH '/user/xuji/yang/data/part-r-00069.gz'
    INTO TABLE e_pingan.kw_test;
# 临时外部表
## 创建临时外部表
-- Create laoniushuju_pv from a query result and expose it as an external table.
-- Hive's documented CTAS restrictions do not allow the target of
-- CREATE TABLE ... AS SELECT to be an external table, so the table is created
-- as a managed table first and switched to external afterwards.
-- NOTE(review): the LOCATION directory presumably has to be empty or absent when the CTAS runs - confirm.
CREATE TABLE IF NOT EXISTS laoniushuju_pv
ROW FORMAT DELIMITED FIELDS TERMINATED BY '\t'
LINES TERMINATED BY '\n'
STORED AS RCFILE
LOCATION '/user/e_pingan/private/laoniushuju/base/laoniushuju_pv'
AS
${查询语句};
-- Mark the table as external so that dropping it leaves the files under LOCATION in place.
ALTER TABLE laoniushuju_pv SET TBLPROPERTIES ('EXTERNAL' = 'TRUE');
# 外部分区表
## 创建外部分区表
-- External table laoniushuju_pv: columns host and pv, partitioned by
-- datelabel and loadstamp, stored as RCFILE under the given LOCATION.
CREATE EXTERNAL TABLE IF NOT EXISTS laoniushuju_pv (
    host STRING,
    pv   BIGINT
)
PARTITIONED BY (datelabel STRING, loadstamp STRING)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
    LINES TERMINATED BY '\n'
STORED AS RCFILE
LOCATION '/user/e_pingan/private/laoniushuju/base/laoniushuju_pv';
## 向表中插入数据
### 查询结果插入数据到分区表
-- Overwrite partition data of laoniushuju_pv with the result of a query.
-- datelabel is given a fixed value; loadstamp is listed without a value.
-- NOTE(review): presumably loadstamp is filled dynamically from the last column of the query - confirm.
INSERT OVERWRITE TABLE laoniushuju_pv
PARTITION (datelabel = '${date}', loadstamp)
${查询语句};
### HDFS数据导入分区表
-- Load a file that is already on HDFS into one partition of laoniushuju_pv.
-- NOTE(review): the table is declared STORED AS RCFILE on this page; presumably the
-- loaded file must already be in that format - confirm.
LOAD DATA INPATH '/user/yangbl/yang/task/文件名'
INTO TABLE laoniushuju_pv
PARTITION (datelabel = '${date}', loadstamp = '${hour}');
### 本地数据导入分区表
-- Load a file from the local filesystem into one partition of laoniushuju_pv.
-- NOTE(review): the table is declared STORED AS RCFILE on this page; presumably the
-- loaded file must already be in that format - confirm.
LOAD DATA LOCAL INPATH '/home/yangbl/data/task/文件名'
INTO TABLE laoniushuju_pv
PARTITION (datelabel = '${date}', loadstamp = '${hour}');
# 存储查询结果
## 保存到HDFS路径
-- Write the result of a query as tab-separated output to an HDFS directory,
-- overwriting the directory's current contents.
INSERT OVERWRITE DIRECTORY '/user/yangbl/yang/task'
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
${查询语句};
## 保存到本地路径
-- Write the result of a query as tab-separated output to a directory on the
-- local filesystem, overwriting the directory's current contents.
INSERT OVERWRITE LOCAL DIRECTORY '/home/yangbl/data/task'
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
${查询语句};
Clone repository
  • Hive_Basic_Configuration
  • Hive_Basic_HQL
  • Hive_Basic_Operation
  • Hive_Table_Operation
  • Home