HIVE基本語法使用

阿新 • • 發佈：2019-02-06

-- Session setting: have the Hive CLI print the column names as a header line above query results.
set hive.cli.print.header=true;

建立一張表

-- Creates the page_view table.
--   * ip carries a column-level COMMENT; the table itself carries a table-level COMMENT.
--   * PARTITIONED BY adds the partition columns dt and country.
--   * Fields inside a row are separated by a tab character.
--   * Data is stored in SequenceFile format.
-- All notes are kept above the statement: HiveQL has no '#' comment syntax, and
-- '--' comment lines are safest outside the statement body.
CREATE TABLE page_view (
    viewTime     INT,
    userid       BIGINT,
    page_url     STRING,
    referrer_url STRING,
    ip           STRING COMMENT 'IP Address of the User'
)
COMMENT 'This is the page view table'
PARTITIONED BY (dt STRING, country STRING)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
STORED AS SEQUENCEFILE;

TEXTFILE
以小檔案形式儲存

//sequencefile
-- Create a comma-delimited table stored as a SequenceFile, then fill it with
-- every row of tab_ext, replacing whatever the table held before.
CREATE TABLE tab_ip_seq (
    id      INT,
    name    STRING,
    ip      STRING,
    country STRING
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY ','
STORED AS SEQUENCEFILE;

INSERT OVERWRITE TABLE tab_ip_seq
SELECT *
FROM tab_ext;

load資料，載入到hive的目錄中去

//create & load
-- Create a comma-delimited text table and load a file from the client's local
-- filesystem into it. The load targets tab_ip, the table created just above,
-- so that the later "select * from tab_ip" statements have data to read.
create table tab_ip(id int,name string,ip string,country string)
    row format delimited
    fields terminated by ','
    stored as textfile;
load data local inpath '/home/hadoop/ip.txt' into table tab_ip;

載入資料，以連結的方式來建立

//external
-- External table: the definition points at files already sitting under
-- /external/hive (comma-delimited text).
CREATE EXTERNAL TABLE tab_ip_ext (
    id      INT,
    name    STRING,
    ip      STRING,
    country STRING
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY ','
STORED AS TEXTFILE
LOCATION '/external/hive';

// CTAS 用於建立一些臨時表儲存中間結果

-- CTAS: create tab_ip_ctas from a query over tab_ip_ext, renaming every column.
-- SORT BY orders rows only within each reducer; unlike ORDER BY it does not
-- guarantee one global ordering across the whole result.
CREATE TABLE tab_ip_ctas
   AS
SELECT id new_id, name new_name, ip new_ip,country new_country
FROM tab_ip_ext
SORT BY new_id;

//insert from select 用於向臨時表中追加中間結果資料

-- Create tab_ip_like with the same definition as tab_ip, then replace its
-- contents with all rows of tab_ip.
CREATE TABLE tab_ip_like LIKE tab_ip;

INSERT OVERWRITE TABLE tab_ip_like
SELECT *
FROM tab_ip;

//CLUSTER <–相對高階一點，你可以放在有精力的時候才去學習>

-- Bucketed table: rows are distributed into 3 buckets by id.
CREATE TABLE tab_ip_cluster (
    id      INT,
    name    STRING,
    ip      STRING,
    country STRING
)
CLUSTERED BY (id) INTO 3 BUCKETS;

分桶


-- Populate the bucketed table, then sample one bucket.
-- The table is filled with INSERT ... SELECT rather than LOAD DATA: LOAD DATA only
-- places the file as-is (no bucketing), and tab_ip_cluster declares no ','
-- field delimiter, so the raw comma-separated file would not parse into columns.
-- Bucketing enforcement is switched on BEFORE the insert so the rows are
-- actually written into 3 bucket files.
set hive.enforce.bucketing=true;
insert overwrite table tab_ip_cluster select * from tab_ip;

-- Read only the 2nd of the 3 buckets (bucketed on id).
select * from tab_ip_cluster tablesample(bucket 2 out of 3 on id);

//PARTITION分割槽

-- Comma-delimited table partitioned by the string column part_flag.
CREATE TABLE tab_ip_part (
    id      INT,
    name    STRING,
    ip      STRING,
    country STRING
)
PARTITIONED BY (part_flag STRING)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY ',';

-- Load one local file per partition; OVERWRITE replaces whatever the target
-- partition already contains.
LOAD DATA LOCAL INPATH '/home/hadoop/ip.txt'
OVERWRITE INTO TABLE tab_ip_part
PARTITION (part_flag = 'part1');

LOAD DATA LOCAL INPATH '/home/hadoop/ip_part2.txt'
OVERWRITE INTO TABLE tab_ip_part
PARTITION (part_flag = 'part2');

-- Read every partition.
SELECT *
FROM tab_ip_part;

-- Read, then count, only the rows of partition part2.
SELECT *
FROM tab_ip_part
WHERE part_flag = 'part2';

SELECT count(*)
FROM tab_ip_part
WHERE part_flag = 'part2';


-- Rename column id of tab_ip to id_alter and declare it as string.
alter table tab_ip change id id_alter string;
-- Add a partition whose data lives at an explicit location.
-- NOTE(review): tab_cts and partCol are not defined anywhere in this file; this looks
-- like a copied template. Presumably the intended target is tab_ip_part / part_flag —
-- confirm before running.
ALTER TABLE tab_cts ADD PARTITION (partCol = 'dt') location '/external/hive/dt';

-- List the partitions of tab_ip_part.
show partitions tab_ip_part;

//write to hdfs把資料寫到hdfs中

-- Export the rows of partition part1 twice: first into a directory on the
-- local filesystem (LOCAL), then into a directory without LOCAL.
-- Both targets are directories, despite the .txt suffix in their names.
INSERT OVERWRITE LOCAL DIRECTORY '/home/hadoop/hivetemp/test.txt'
SELECT *
FROM tab_ip_part
WHERE part_flag = 'part1';

INSERT OVERWRITE DIRECTORY '/hiveout.txt'
SELECT *
FROM tab_ip_part
WHERE part_flag = 'part1';

//array 陣列的使用

-- Table with two array columns. Columns are separated by a tab; the elements
-- inside each array are separated by a comma.
CREATE TABLE tab_array (
    a ARRAY<INT>,
    b ARRAY<STRING>
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
    COLLECTION ITEMS TERMINATED BY ',';

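示例資料（注意：此範例第一欄是字串、第二欄是超出 INT 範圍的數字，與上面 a array<int>、b array<string> 的欄位定義不符；照此載入時 a 的元素會變成 NULL。若要直接使用這份資料，應把定義改為 a array<string>、b array<bigint>）
tobenbrone,laihama,woshishui     13866987898,13287654321
abc,iloveyou,itcast     13866987898,13287654321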


-- First element of array column a for every row.
SELECT a[0]
FROM tab_array;

-- Rows whose array column b contains the string 'word'.
SELECT *
FROM tab_array
WHERE array_contains(b, 'word');

-- Build array values on the fly from tab_ext columns and append them.
INSERT INTO TABLE tab_array
SELECT
    array(0),
    array(name, ip)
FROM tab_ext t;

//map的使用

-- Table with a map column. Columns are separated by a tab, map entries by ';',
-- and each key is separated from its value by ':'.
CREATE TABLE tab_map (
    name STRING,
    info MAP<STRING, STRING>
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
    COLLECTION ITEMS TERMINATED BY ';'
    MAP KEYS TERMINATED BY ':';

示例資料：
fengjie         age:18;size:36A;addr:usa
furong      age:28;size:39C;addr:beijing;weight:180KG


-- Replace the table contents with a local file, then append rows whose map
-- value is built from the name and ip columns of tab_ext.
LOAD DATA LOCAL INPATH '/home/hadoop/hivetemp/tab_map.txt'
OVERWRITE INTO TABLE tab_map;

INSERT INTO TABLE tab_map
SELECT
    name,
    map('name', name, 'ip', ip)
FROM tab_ext;

//struct結構體

-- Table with a struct column (age, tel, addr). Columns are separated by a tab;
-- the struct's fields are separated by a comma.
-- The trailing ';' is required: without it the following LOAD DATA statement
-- is parsed as part of this CREATE TABLE and fails.
create table tab_struct(name string,info struct<age:int,tel:string,addr:string>)
row format delimited
fields terminated by '\t'
collection items terminated by ',';

-- Replace the table contents with a local file, then append rows whose struct
-- value is assembled from tab_ext columns via named_struct.
LOAD DATA LOCAL INPATH '/home/hadoop/hivetemp/tab_st.txt'
OVERWRITE INTO TABLE tab_struct;

INSERT INTO TABLE tab_struct
SELECT
    name,
    named_struct('age', id, 'tel', name, 'addr', country)
FROM tab_ext;

怎麼在shell語句中執行，可以用於批處理


# Run one HiveQL statement from the shell (-e) in silent mode (-S) and redirect the result to a file.
# GROUP BY country is required: country is selected next to count(*), and Hive rejects
# a non-aggregated column that is not in the GROUP BY key.
hive -S -e 'select country,count(*) from tab_ext group by country' > /home/hadoop/hivetemp/e.txt
有了這種執行機制，就使得我們可以利用指令碼語言（bash shell,python）進行hql語句的批量執行


-- Five rows of tab_ext, sorted by id descending with SORT BY.
SELECT *
FROM tab_ext
SORT BY id DESC
LIMIT 5;

-- Pair each tab_ext row with the matching tab_ip_book row by name.
SELECT
    a.ip,
    b.book
FROM tab_ext a
JOIN tab_ip_book b
    ON (a.name = b.name);

//UDF自定義函式的使用



-- Built-in conditional: label the row with id = 1 as 'first' and every other row as 'no-first'.
-- The labels must be quoted string literals; unquoted, first is read as a column
-- name and no-first as the subtraction no - first.
select if(id=1,'first','no-first'),name from tab_ext;

-- Custom UDF: add the jar to the session, bind the temporary function name
-- my_lower to the class org.dht.Lower, then call it.
-- The query calls my_lower, the name actually registered (the original called
-- an unregistered my_upper). The "hive>" CLI prompts are dropped so the three
-- lines can be pasted or run as a script.
add jar /home/hadoop/myudf.jar;
CREATE TEMPORARY FUNCTION my_lower AS 'org.dht.Lower';
select my_lower(name) from tab_ext;

HIVE基本語法使用

set hive.cli.print.header=true; 建立一張表 CREATE TABLE page_view(viewTime INT, userid BIGINT, page

hive的基本語法操作

基本操作 DDL操作資料庫- -----1. 建立資料庫：預設儲存在：HDFS預設位置：/user/hive/warehouse/資料庫名.db create database if not exists hive; -----2. 檢視資料庫 show d

HIVE SQL 基本語法

1.DDL 操作 1.建表 2.3.建立簡單表 4.建立外部表 5.建分割槽表 6.建Bucket表 7.建立表並建立索引欄位ds 8.複製一個空表 9.顯示所有表 10.按正條件正則表示式顯示錶 11.修改表結構 12.表新增一列 13.新增一列並增加列欄位註釋

hive的基本語法匯總（hql）

生成就是種類型 class bin ike 分塊 ear ket 2019/2/20 星期三 hive的基本語法匯總（hql）——————————————————————————————————————————————Hive學習3：Hive三種建表語句詳解 https

[C#] CSharp 基本語法

windows library 命名方式編譯器帕斯卡一、基礎1.規範:除常量外,所有變量用駝峰命名方式,其它用帕斯卡命名方式. 2.編譯:首先由csc.exe將cs文件編譯成MSIL.當雙擊exe的時候,會由clr的jit(just in time)編譯器再次編譯成cpu指令.csc

Swift基礎學習(一)基本語法

postfix 合數語言特性初學者表達式 public 能夠 dict 命名　　Swift 簡介(贊美一番，收集了多篇關於Swift 學習教程的語言簡介一直以為英語和漢語混寫的時候只是英語字母結尾的地方打空格，原來是英語字母的開頭和結尾都要加一個空格，英語字母

C# 基本語法

stack 執行指定 rect pub 標識符 ont check orderby end C# 是一種面向對象的編程語言。在面向對象的程序設計方法中，程序由各種相互交互的對象組成。相同種類的對象通常具有相同的類型，或者說，是在相同的 class 中。例如，以 Recta

SQL語句基本語法

sql首先寫入可顯示中文代碼set character_set_client=gbk; set character_set_results=gbk;或只輸一句 set names gbk;創建數據庫create database 庫名;查詢現有數據局show databases;刪除數據庫drop data

Xml一（基本語法和約束）、

字符一行語言 oca cas 書寫 xsd ati 寫法 XML：eXtensible Markup Language 可擴展標記語言 version="1.0" 　　　　* 可擴展：所有的標簽都是自定義的。　　　　* 功能：數據存儲　　　　* 配置文件　

Markdown 基本語法

最大添加 tle lin hello -s mark lock 橫線 1. 標題設置（讓字體變大，和word的標題意思一樣）在Markdown當中設置標題，有兩種方式：第一種：通過在文字下方添加“=”和“-”，他們分別表示一級標題和二級標題。第二種：在文字開頭加上 “#”

Day1[下] - Python基礎基本語法、流程控制

數字 tin 流程 label reference rst too ren ogr 一、變量\字符編碼 Variables are used to store information to be referenced and manipulated in a comput

python 基本語法速覽，快速入門

我們 method adding ger monk use gre 數據類型 struct https://zhuanlan.zhihu.com/p/24536868 學習參考於這個博文。我做一個筆記。關於python一些常用的語法快速的預覽，適合已經掌握一門編程語

R的基本語法總結

adobe hist 當我 colors gda 編碼找到 cati 逆時針條形圖：基本語法： barplot(H, xlab, ylab, main, names.arg, col) H是包含在挑選圖中使用的數值的向量或矩陣

1.基本語法

lan strong set script rst rip 關於 col doctype 整個教程默認是需要html和css的基礎的，如果後面需要，我會抽時間在寫一份html和css的入門教程；閑話少說，接下來我們一起進入JavaScript這門語言的大門吧！一、Jav

Kotlin VS Java：基本語法差異（轉載）

允許接收 point this view 學習替換同時 ons 5月18號，goole宣布Kotlin成為官方支持的開發語言以來，Kotlin語言社區，公眾號，qq群等全面轟炸，本文是一篇譯文，來自國外的一個用戶，將給大家介紹，基礎語法部分Kotlin和java之間的

1go基本語法

pan 導入 world 函數 ... pac ring 方法 ack // week1 project main.go//導入一個包（目錄） package main //導入方法 import "fmt" //createMessage函數(參數，類型)返回值的類型(

shell--grep命令+正則表達式+基本語法

及其 gre awk 使用 part 開頭合集運算符擴展什麽是正則正則就是用一些具有特殊含義的符號組合到一起（稱為正則表達式）來描述字符或者字符串的方法。或者說：正則就是用來描述一類事物的規則。在linux中，通配符是由shell解釋的，而正則表達式則是由命令解

008-Hadoop Hive sql語法詳解3-DML 操作:元數據存儲

pan 查詢寫入所有 not insert語句 int 寫入文件文件系統一、概述 hive不支持用insert語句一條一條的進行插入操作，也不支持update操作。數據是以load的方式加載到建立好的表中。數據一旦導入就不可以修改。 DML包括：INSERT插入

Shell第三篇：基本語法

允許主體賦值算數 export $* lar script userdel 目錄一、什麽是shell script 二、變量三、運算符四、流程控制五、函數　　一、什麽是shell script 　　將OS命令堆積到可執行文件裏，由上至下的順序執行文本裏的

js基本語法及註意事項

name tab 設置刪除元素 ext ack rop 捕獲 ons 正則表達式：var x=/^a{2,8}$/;alert(x.test("aaa"));正則表達式一般用於表單驗證。<form onsubmit="return checkForm()">

HIVE基本語法使用

相關推薦