31b57a494b
* fix: #295 impala data types suggestion * fix: #297 impala create table with STRUCT
215 lines
6.7 KiB
SQL
215 lines
6.7 KiB
SQL
CREATE EXTERNAL TABLE external_parquet (c1 INT, c2 STRING, c3 TIMESTAMP)
|
|
STORED AS PARQUET LOCATION '/user/etl/destination';
|
|
|
|
create table census (name string, census_year int) partitioned by (year int);
|
|
|
|
CREATE TABLE census_data (last_name STRING, first_name STRING, state STRING, address STRING)
|
|
SORT BY (last_name, state)
|
|
STORED AS PARQUET
|
|
TBLPROPERTIES ('transactional'='true', 'transactional_properties'='insert_only');
|
|
|
|
CREATE TABLE sorted_census_data
|
|
SORT BY (last_name, state)
|
|
STORED AS PARQUET
|
|
AS SELECT last_name, first_name, state, address
|
|
FROM unsorted_census_data;
|
|
|
|
CREATE TABLE yy2 (s STRING, year INT);
|
|
|
|
CREATE TABLE kudu_no_partition_by_clause
|
|
(
|
|
id bigint PRIMARY KEY, s STRING, b BOOLEAN
|
|
)
|
|
STORED AS KUDU;
|
|
|
|
CREATE TABLE kudu_t1 (id BIGINT PRIMARY key, s STRING, b BOOLEAN)
|
|
PARTITION BY HASH (id) PARTITIONS 20 STORED AS KUDU;
|
|
|
|
CREATE TABLE kudu_t2 (id BIGINT, s STRING, b BOOLEAN, PRIMARY KEY (id,s))
|
|
PARTITION BY HASH (s) PARTITIONS 30 STORED AS KUDU;
|
|
|
|
CREATE TABLE kudu_t3 (id BIGINT, year INT, s STRING,
|
|
b BOOLEAN, PRIMARY KEY (id,year))
|
|
PARTITION BY HASH (id) PARTITIONS 20,
|
|
RANGE (year) (PARTITION 1980 <= VALUES < 1990,
|
|
PARTITION 1990 <= VALUES < 2000,
|
|
PARTITION VALUE = 2001,
|
|
PARTITION 2001 < VALUES < 2003)
|
|
STORED AS KUDU;
|
|
|
|
CREATE EXTERNAL TABLE external_t1 STORED AS KUDU
|
|
TBLPROPERTIES ('kudu.table_name'='kudu_tbl_created_via_api');
|
|
|
|
CREATE EXTERNAL TABLE myextkudutbl (
|
|
id int PRIMARY KEY,
|
|
name string)
|
|
PARTITION BY HASH PARTITIONS 8
|
|
STORED AS KUDU
|
|
TBLPROPERTIES ('external.table.purge'='true');
|
|
|
|
CREATE TABLE ctas_t1
|
|
PRIMARY KEY (id) PARTITION BY HASH (id) PARTITIONS 10
|
|
STORED AS KUDU
|
|
AS SELECT id, s FROM kudu_t1;
|
|
|
|
CREATE TABLE pk_multiple_columns
|
|
(
|
|
col1 BIGINT,
|
|
col2 STRING,
|
|
col3 BOOLEAN,
|
|
PRIMARY KEY (col1, col2)
|
|
) PARTITION BY HASH(col2) PARTITIONS 2 STORED AS KUDU;
|
|
|
|
CREATE TABLE user.inline_pk_rewritten (
|
|
id BIGINT NOT NULL ENCODING AUTO_ENCODING COMPRESSION DEFAULT_COMPRESSION,
|
|
s STRING NULL ENCODING AUTO_ENCODING COMPRESSION DEFAULT_COMPRESSION,
|
|
PRIMARY KEY (id)
|
|
)
|
|
PARTITION BY HASH (id) PARTITIONS 2
|
|
STORED AS KUDU
|
|
TBLPROPERTIES ('kudu.master_addresses'='host.example.com');
|
|
|
|
CREATE TABLE default_vals
|
|
(
|
|
id BIGINT PRIMARY KEY,
|
|
name STRING NOT NULL DEFAULT 'unknown',
|
|
address STRING DEFAULT upper('no fixed address'),
|
|
age INT DEFAULT -1,
|
|
earthling BOOLEAN DEFAULT TRUE,
|
|
planet_of_origin STRING DEFAULT 'Earth',
|
|
optional_col STRING DEFAULT NULL
|
|
) PARTITION BY HASH(id) PARTITIONS 2 STORED AS KUDU;
|
|
|
|
CREATE TABLE various_encodings
|
|
(
|
|
id BIGINT PRIMARY KEY,
|
|
c1 BIGINT ENCODING PLAIN_ENCODING,
|
|
c2 BIGINT ENCODING AUTO_ENCODING,
|
|
c3 TINYINT ENCODING BIT_SHUFFLE,
|
|
c4 DOUBLE ENCODING BIT_SHUFFLE,
|
|
c5 BOOLEAN ENCODING RLE,
|
|
c6 STRING ENCODING DICT_ENCODING,
|
|
c7 STRING ENCODING PREFIX_ENCODING
|
|
) PARTITION BY HASH(id) PARTITIONS 2 STORED AS KUDU;
|
|
|
|
|
|
CREATE TABLE blog_posts
|
|
(
|
|
user_id STRING ENCODING DICT_ENCODING,
|
|
post_id BIGINT ENCODING BIT_SHUFFLE,
|
|
subject STRING ENCODING PLAIN_ENCODING,
|
|
body STRING COMPRESSION LZ4,
|
|
spanish_translation STRING COMPRESSION SNAPPY,
|
|
esperanto_translation STRING COMPRESSION ZLIB,
|
|
PRIMARY KEY (user_id, post_id)
|
|
) PARTITION BY HASH(user_id, post_id) PARTITIONS 2 STORED AS KUDU;
|
|
|
|
|
|
CREATE TABLE various_encodings
|
|
(
|
|
id BIGINT PRIMARY KEY,
|
|
c1 BIGINT ENCODING PLAIN_ENCODING,
|
|
c2 BIGINT ENCODING AUTO_ENCODING,
|
|
c3 TINYINT ENCODING BIT_SHUFFLE,
|
|
c4 DOUBLE ENCODING BIT_SHUFFLE,
|
|
c5 BOOLEAN ENCODING RLE,
|
|
c6 STRING ENCODING DICT_ENCODING,
|
|
c7 STRING ENCODING PREFIX_ENCODING
|
|
) PARTITION BY HASH(id) PARTITIONS 2 STORED AS KUDU;
|
|
|
|
create table million_rows_one_range (id string primary key, s string)
|
|
partition by hash(id) partitions 50,
|
|
range (partition 'a' <= values < '{')
|
|
stored as kudu;
|
|
|
|
create table million_rows_two_ranges (id string primary key, s string)
|
|
partition by hash(id) partitions 50,
|
|
range (partition 'a' <= values < '{', partition 'A' <= values < '[', partition value = '00000')
|
|
stored as kudu;
|
|
|
|
create table million_rows_three_ranges (id string primary key, s string)
|
|
partition by hash (school) partitions 10,
|
|
range (letter_grade) (partition value = 'A', partition value = 'B',
|
|
partition value = 'C', partition value = 'D', partition value = 'F')
|
|
stored as kudu;
|
|
|
|
create table hash_t5 (x bigint, y bigint, s string, primary key (x,y))
|
|
partition by hash (x) partitions 10, hash (y) partitions 20, hash (y) partitions 20
|
|
stored as kudu;
|
|
|
|
create table range_t1 (x bigint, s string, s2 string, primary key (x, s))
|
|
partition by range (x)
|
|
(
|
|
partition 0 <= values <= 49, partition 50 <= values <= 100,
|
|
partition value < 0, partition 100 < values <= 500,
|
|
partition values < 0, partition 100 < values
|
|
)
|
|
stored as kudu;
|
|
|
|
create table combined_t1 (x bigint, s string, s2 string, primary key (x, s))
|
|
partition by hash (x) partitions 10, range (x)
|
|
(
|
|
partition 0 <= values <= 49, partition 50 <= values <= 100
|
|
)
|
|
stored as kudu;
|
|
|
|
CREATE TABLE t5 AS SELECT upper(y) AS s, x+1 AS a, 'Entirely new column' AS n FROM t1;
|
|
|
|
CREATE TABLE parquet_version_of_t1 STORED AS PARQUET AS SELECT * FROM t1;
|
|
|
|
create table partitions_yes partitioned by (year, month)
|
|
as select s, year, month from partitions_no;
|
|
|
|
CREATE TABLE my_first_table (id BIGINT, name STRING, PRIMARY KEY (id)) PARTITION BY HASH PARTITIONS 16 STORED AS KUDU TBLPROPERTIES ('kudu.num_tablet_replicas' = '1');
|
|
|
|
CREATE TABLE parquet_table (id INT) STORED AS PARQUET;
|
|
|
|
CREATE TABLE games3 (id BIGINT, play ARRAY < MAP < STRING, BIGINT > >) STORED AS PARQUET;
|
|
|
|
CREATE TABLE games3 (id BIGINT, play ARRAY < MAP < STRING, BIGINT > >) STORED AS PARQUET;
|
|
|
|
create table unsorted (x bigint);
|
|
|
|
CREATE TABLE pk(col1 INT, col2 STRING, PRIMARY KEY(col1, col2));
|
|
|
|
CREATE TABLE fk(id INT, col1 INT, col2 STRING, PRIMARY KEY(id),
|
|
FOREIGN KEY(col1, col2) REFERENCES pk(col1, col2));
|
|
|
|
CREATE TABLE pk(id INT, PRIMARY KEY(id) DISABLE, NOVALIDATE, RELY);
|
|
|
|
CREATE TABLE fk(id INT, col1 INT, col2 STRING, PRIMARY KEY(id),
|
|
FOREIGN KEY(col1, col2) REFERENCES pk(col1, col2));
|
|
|
|
CREATE TABLE new_Table like old_table;
|
|
|
|
CREATE TABLE new_Table like old_table partitioned by (year int) SORT BY (last_name, state);
|
|
|
|
CREATE TABLE IF NOT EXISTS t1 (id INT);
|
|
CREATE TABLE IF NOT EXISTS t1 (
|
|
id1 INT,
|
|
id2 BINARY,
|
|
id3 BIGINT,
|
|
id4 BOOLEAN,
|
|
id5 CHAR(4),
|
|
id6 DATE,
|
|
id7 DECIMAL(38, 0),
|
|
id8 DOUBLE,
|
|
id9 INT,
|
|
id10 MAP<INT, DOUBLE>,
|
|
id11 REAL,
|
|
id12 SMALLINT,
|
|
id13 FLOAT,
|
|
id14 STRING,
|
|
id15 STRUCT,
|
|
id16 TIMESTAMP,
|
|
id17 TINYINT,
|
|
id18 VARCHAR(256),
|
|
id19 COMPLEX,
|
|
id19 ARRAY<INT>
|
|
);
|
|
|
|
CREATE TABLE IF NOT EXISTS t1 (
|
|
id INT,
|
|
person STRUCT<first_name: STRING, last_name: VARCHAR(256)>
|
|
) PARTITIONED BY (student STRUCT<id: INT, name: VARCHAR(256), height: STRING, cost: DECIMAL(38, 0)>);
|