mirror of
https://github.com/apache/impala.git
synced 2026-02-01 12:00:22 -05:00
IMPALA-11809 added support for non unique primary keys on Kudu tables. It allows creating a Kudu table without specifying a primary key, since partition columns can be promoted as a non unique primary key. However, when creating a Kudu table with CTAS without specifying a primary key, Impala returned a parsing error. This patch fixes the parsing issue for creating a Kudu table with CTAS without specifying a primary key. Testing: - Added new test cases to the parsing unit tests and the end-to-end tests. - Passed core tests. Change-Id: Ia7bb0cf1954e0a4c3d864a800e929a88de272dd5 Reviewed-on: http://gerrit.cloudera.org:8080/19825 Reviewed-by: Abhishek Chennaka <achennaka@cloudera.com> Reviewed-by: Riza Suminto <riza.suminto@cloudera.com> Tested-by: Impala Public Jenkins <impala-public-jenkins@cloudera.com>
668 lines
19 KiB
Plaintext
668 lines
19 KiB
Plaintext
====
|
|
---- QUERY
|
|
# CTAS into a hash-partitioned Kudu table with an explicit primary key,
# then read the inserted rows back.
create table t primary key (id) partition by hash (id) partitions 3
|
|
stored as kudu
|
|
as select id, int_col from functional.alltypestiny;
|
|
select * from t;
|
|
---- RESULTS
|
|
0,0
|
|
1,1
|
|
2,0
|
|
3,1
|
|
4,0
|
|
5,1
|
|
6,0
|
|
7,1
|
|
---- TYPES
|
|
INT,INT
|
|
====
|
|
---- QUERY
|
|
# Boolean primary key column
|
|
create table tab (x int, y boolean, primary key(x, y))
|
|
partition by hash (x) partitions 3 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: key column may not have type of BOOL, FLOAT, or DOUBLE
|
|
====
|
|
---- QUERY
|
|
# Float primary key column
|
|
create table tab (x int, y float, primary key(x, y))
|
|
partition by hash (x) partitions 3 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: key column may not have type of BOOL, FLOAT, or DOUBLE
|
|
====
|
|
---- QUERY
|
|
# Primary keys should be declared first
|
|
create table tab (x int, y int, primary key(y))
|
|
partition by hash (y) partitions 3 stored as kudu
|
|
---- CATCH
|
|
ImpalaRuntimeException: Kudu PRIMARY KEY columns must be specified as the first columns in the table (expected leading columns ('y') but found ('x'))
|
|
====
|
|
---- QUERY
|
|
# Primary keys should be listed in the same order
|
|
create table tab (x int, y int, z int, primary key(y,x))
|
|
partition by hash (y) partitions 3 stored as kudu
|
|
---- CATCH
|
|
ImpalaRuntimeException: Kudu PRIMARY KEY columns must be specified as the first columns in the table (expected leading columns ('y', 'x') but found ('x', 'y'))
|
|
====
|
|
---- QUERY
|
|
# Small number of hash partitions
|
|
create table tab (a int, b int, c int, d int, primary key(a, b, c))
|
|
partition by hash(a,b) partitions 8, hash(c) partitions 1 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: must have at least two hash buckets
|
|
====
|
|
---- QUERY
|
|
# Same column in multiple hash based distributions
|
|
create table tab (a int, b int, primary key (a))
|
|
partition by hash (a) partitions 3, hash (a) partitions 2 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: hash bucket schema components must not contain columns in common
|
|
====
|
|
---- QUERY
|
|
# Same column referenced multiple times in the same hash-based distribution
|
|
create table tab (a int primary key) partition by hash (a, a, a) partitions 3
|
|
stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: hash bucket schema components must not contain columns in common
|
|
====
|
|
---- QUERY
|
|
# Kudu table that uses Impala keywords as table name and column names
|
|
create table `add`(`analytic` int, `function` int, primary key(`analytic`, `function`))
|
|
partition by hash (`analytic`) partitions 4, range (`function`)
|
|
(partition values <= 1, partition 1 < values <= 10, partition 10 < values) stored as kudu;
|
|
insert into `add` select id, int_col from functional.alltypestiny;
|
|
select * from `add`
|
|
---- RESULTS
|
|
0,0
|
|
1,1
|
|
2,0
|
|
3,1
|
|
4,0
|
|
5,1
|
|
6,0
|
|
7,1
|
|
---- TYPES
|
|
INT,INT
|
|
====
|
|
---- QUERY
|
|
# Test implicit casting/folding of partition values.
|
|
create table tab (a int not null primary key)
|
|
partition by range (a) (partition value = false)
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Invalid hostname
|
|
create table tdata_bogus_host (id int primary key, name string, valf float, vali bigint)
|
|
PARTITION BY RANGE (PARTITION 10 <= VALUES <= 30) STORED AS KUDU
|
|
TBLPROPERTIES('kudu.master_addresses' = 'bogus host name')
|
|
---- CATCH
|
|
Couldn't resolve this master's address bogus host name:7051
|
|
====
|
|
---- QUERY
|
|
# Non-existing host
|
|
create table tdata_non_existing_host
|
|
(id int primary key, name string, valf float, vali bigint)
|
|
PARTITION BY RANGE (PARTITION 10 <= VALUES <= 30) STORED AS KUDU
|
|
TBLPROPERTIES('kudu.master_addresses' = 'bogus.host.name')
|
|
---- CATCH
|
|
Couldn't resolve this master's address bogus.host.name:7051
|
|
====
|
|
---- QUERY
|
|
# Valid host with whitespace
|
|
create table tdata_master_addresses_whitespace (id int primary key) stored as kudu
|
|
tblproperties('kudu.master_addresses' = ' $INTERNAL_LISTEN_HOST ')
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Insert into the table that was created with whitespace around its
# 'kudu.master_addresses' value.
insert into tdata_master_addresses_whitespace values (0), (1)
|
|
---- DML_RESULTS: tdata_master_addresses_whitespace
|
|
0
|
|
1
|
|
====
|
|
---- QUERY
|
|
# Test that string case is ignored
|
|
create table ignore_column_case (Id int, NAME string, vAlf float, vali bigint,
|
|
primary key (Id, NAME)) PARTITION BY RANGE (PARTITION VALUE = (1, 'Martin'))
|
|
STORED AS KUDU
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Insert one row into the table whose columns were declared with mixed-case names.
insert into ignore_column_case values (1, 'Martin', 1.0, 10);
|
|
---- RESULTS
|
|
: 1
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 1
|
|
NumRowErrors: 0
|
|
====
|
|
---- QUERY
|
|
# Reference the columns in the select list and the predicate with casing that
# differs from the casing used in the CREATE TABLE statement.
select ID, nAmE, VALF, VALI from ignore_column_case where NaMe = 'Martin';
|
|
---- RESULTS
|
|
1,'Martin',1.0,10
|
|
---- TYPES
|
|
INT,STRING,FLOAT,BIGINT
|
|
====
|
|
---- QUERY
|
|
# Using NULL as default values
|
|
create table tbl_with_null_defaults (x int primary key, i1 tinyint default null,
|
|
i2 smallint default null, i3 int default null, i4 bigint default null,
|
|
vals string default null, valf float default null, vald double default null,
|
|
valb boolean default null, valdec4 decimal(9) default null,
|
|
valdec8 decimal(18) default null, valdec16 decimal(38) default null,
|
|
valdate date default null, valvc varchar(2000) default null)
|
|
partition by hash (x) partitions 3 stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Supply only the key column; every other column is expected to take its
# declared NULL default.
insert into tbl_with_null_defaults (x) values (1);
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 1
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
X, I1, I2, I3, I4, VALS, VALF, VALD, VALB, VALDEC4, VALDEC8, VALDEC16, VALDATE, VALVC
|
|
---- DML_RESULTS: tbl_with_null_defaults
|
|
1,NULL,NULL,NULL,NULL,'NULL',NULL,NULL,NULL,NULL,NULL,NULL,NULL,'NULL'
|
|
---- TYPES
|
|
INT,TINYINT,SMALLINT,INT,BIGINT,STRING,FLOAT,DOUBLE,BOOLEAN,DECIMAL,DECIMAL,DECIMAL,DATE,STRING
|
|
====
|
|
---- QUERY
|
|
# Overlapping ranges are rejected by the Kudu client
|
|
create table ts_ranges (ts timestamp primary key, i int)
|
|
partition by range (
|
|
partition cast('2009-01-02 00:00:00' as timestamp) <= VALUES <
|
|
cast('2009-01-03 00:00:00' as timestamp),
|
|
partition cast('2009-01-02 10:00:00' as timestamp) <= VALUES
|
|
) stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: overlapping range partitions: first range partition: 2009-01-02T00:00:00.000000Z <= VALUES < 2009-01-03T00:00:00.000000Z, second range partition: 2009-01-02T10:00:00.000000Z <= VALUES
|
|
====
|
|
---- QUERY
|
|
# Creates a range partitioned Kudu table with a timestamp PK. Note that nanoseconds
|
|
# are rounded (same behavior as when writing timestamp values to Kudu).
|
|
create table ts_ranges (ts timestamp primary key, i int)
|
|
partition by range (
|
|
partition nanoseconds_add(cast('2009-01-01 00:00:00' as timestamp), 999) <= VALUES <
|
|
nanoseconds_add(cast('2009-01-02 00:00:00' as timestamp), 1),
|
|
partition cast('2009-01-02 00:00:00' as timestamp) <= VALUES <
|
|
cast('2009-01-03 00:00:00' as timestamp),
|
|
partition '2009-01-03 00:00:00' <= VALUES
|
|
) stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# List the range partitions of ts_ranges; the expected bounds are printed with
# microsecond precision.
show range partitions ts_ranges
|
|
---- RESULTS
|
|
'2009-01-01T00:00:00.000001Z <= VALUES < 2009-01-02T00:00:00.000000Z'
|
|
'2009-01-02T00:00:00.000000Z <= VALUES < 2009-01-03T00:00:00.000000Z'
|
|
'VALUES >= 2009-01-03T00:00:00.000000Z'
|
|
---- TYPES
|
|
STRING
|
|
====
|
|
---- QUERY
|
|
# CTAS into a range-partitioned Kudu table with a timestamp primary key. The
# partition bounds are given as string literals rather than timestamp casts.
create table ts_ranges_ctas
|
|
primary key (ts)
|
|
partition by range (
|
|
partition VALUES < '2009-01-02 00:00:00',
|
|
partition '2009-01-02 00:00:00' <= VALUES <
|
|
'2009-01-03 00:00:00',
|
|
partition '2009-01-03 00:00:00' < VALUES,
|
|
partition VALUE = ('2009-01-03 00:00:00')
|
|
)
|
|
stored as kudu
|
|
as select timestamp_col ts, id from functional.alltypestiny;
|
|
---- RESULTS
|
|
'Inserted 8 row(s)'
|
|
====
|
|
---- QUERY
|
|
# List the range partitions of the table created by the CTAS statement.
show range partitions ts_ranges_ctas
|
|
---- RESULTS
|
|
'VALUES < 2009-01-02T00:00:00.000000Z'
|
|
'2009-01-02T00:00:00.000000Z <= VALUES < 2009-01-03T00:00:00.000000Z'
|
|
'VALUE = 2009-01-03T00:00:00.000000Z'
|
|
'VALUES >= 2009-01-03T00:00:00.000001Z'
|
|
---- TYPES
|
|
STRING
|
|
====
|
|
---- QUERY
|
|
# Read back the rows inserted by the CTAS statement, ordered by id.
select * from ts_ranges_ctas order by id
|
|
---- RESULTS
|
|
2009-01-01 00:00:00,0
|
|
2009-01-01 00:01:00,1
|
|
2009-02-01 00:00:00,2
|
|
2009-02-01 00:01:00,3
|
|
2009-03-01 00:00:00,4
|
|
2009-03-01 00:01:00,5
|
|
2009-04-01 00:00:00,6
|
|
2009-04-01 00:01:00,7
|
|
---- TYPES
|
|
TIMESTAMP,INT
|
|
====
|
|
---- QUERY
|
|
# Creates a Kudu table with timestamp column default values.
|
|
create table ts_default (i int primary key, ts1 timestamp,
|
|
ts2 timestamp default cast('2009-01-01 00:00:00' as timestamp))
|
|
partition by hash(i) partitions 3 stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Supply only the key: ts2 is expected to take its declared default, while ts1
# (declared without a default) is expected to be NULL.
insert into ts_default (i) values (1);
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 1
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
I, TS1, TS2
|
|
---- DML_RESULTS: ts_default
|
|
1,NULL,2009-01-01 00:00:00
|
|
---- TYPES
|
|
INT,TIMESTAMP,TIMESTAMP
|
|
====
|
|
---- QUERY
|
|
# An explicit NULL for ts2 is expected to be stored as NULL rather than being
# replaced by the column default.
insert into ts_default (i, ts1, ts2) values (2, NULL, NULL);
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 1
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
I, TS1, TS2
|
|
---- DML_RESULTS: ts_default
|
|
1,NULL,2009-01-01 00:00:00
|
|
2,NULL,NULL
|
|
---- TYPES
|
|
INT,TIMESTAMP,TIMESTAMP
|
|
====
|
|
---- QUERY
|
|
# create an unpartitioned table
|
|
create table unpartitioned_kudu_table (col0 bigint primary key, col1 string)
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
---- ERRORS
|
|
Unpartitioned Kudu tables are inefficient for large data sizes.
|
|
====
|
|
---- QUERY
|
|
# Insert two rows into the unpartitioned table.
insert into unpartitioned_kudu_table values (0, 'zero'), (1, 'one')
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 2
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
COL0,COL1
|
|
---- DML_RESULTS: unpartitioned_kudu_table
|
|
0,'zero'
|
|
1,'one'
|
|
---- TYPES
|
|
BIGINT,STRING
|
|
====
|
|
---- QUERY
|
|
# CTAS into an unpartitioned Kudu table, keeping only the source rows with id > 4.
create table unpartitioned_kudu_table2 primary key(id) stored as kudu
|
|
as select id from functional.alltypestiny where id > 4
|
|
---- RESULTS
|
|
'Inserted 3 row(s)'
|
|
---- ERRORS
|
|
Unpartitioned Kudu tables are inefficient for large data sizes.
|
|
====
|
|
---- QUERY
|
|
# Read back the rows inserted by the CTAS statement.
select * from unpartitioned_kudu_table2
|
|
---- RESULTS
|
|
5
|
|
6
|
|
7
|
|
---- LABELS
|
|
ID
|
|
---- TYPES
|
|
INT
|
|
====
|
|
---- QUERY
|
|
# Creates a Kudu table with decimal columns and primary key
|
|
create table create_decimal
|
|
(
|
|
decimal_4 decimal(9, 9),
|
|
decimal_8 decimal(18, 2) not null default 100.00,
|
|
decimal_16 decimal(38, 0) null,
|
|
primary key (decimal_4))
|
|
stored as kudu;
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Create as select table with decimal columns and primary key
|
|
create table ctas_decimal primary key (d1,d2,d3)
|
|
stored as kudu
|
|
as select * from functional.decimal_tbl;
|
|
select * from ctas_decimal;
|
|
---- RESULTS
|
|
1234,2222,1.2345678900,0.12345678900000000000000000000000000000,12345.78900,1
|
|
2345,111,12.3456789000,0.12345678900000000000000000000000000000,3.14100,1
|
|
12345,333,123.4567890000,0.12345678900000000000000000000000000000,11.22000,1
|
|
12345,333,1234.5678900000,0.12345678900000000000000000000000000000,0.10000,1
|
|
132842,333,12345.6789000000,0.12345678900000000000000000000000000000,0.77889,1
|
|
---- TYPES
|
|
DECIMAL,DECIMAL,DECIMAL,DECIMAL,DECIMAL,DECIMAL
|
|
====
|
|
---- QUERY
|
|
# IMPALA-6954: CTAS with an expr rewrite.
|
|
create table ctas_rewrite primary key(id)
|
|
partition by range(id) (partition 0 <= values < 100) stored as kudu
|
|
as select id, tinyint_col from functional.alltypes
|
|
where id between 0 and 1;
|
|
show range partitions ctas_rewrite;
|
|
---- RESULTS
|
|
'0 <= VALUES < 100'
|
|
====
|
|
---- QUERY
|
|
# create table with primary key of DATE type
|
|
create table kudu_date_key (fdatekey date primary key, val string)
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
---- ERRORS
|
|
Unpartitioned Kudu tables are inefficient for large data sizes.
|
|
====
|
|
---- QUERY
|
|
# Insert two rows keyed by DATE literals.
insert into kudu_date_key values (DATE '1970-01-01', 'Unix epoch'), (DATE '2019-12-12', 'today')
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 2
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
FDATEKEY,VAL
|
|
---- DML_RESULTS: kudu_date_key
|
|
1970-01-01,'Unix epoch'
|
|
2019-12-12,'today'
|
|
---- TYPES
|
|
DATE,STRING
|
|
====
|
|
---- QUERY
|
|
# create table with invalid default DATE value
|
|
create table kudu_invalid_default_date (fdate date default DATE '111111-33-33')
|
|
stored as kudu
|
|
---- CATCH
|
|
AnalysisException: Invalid date literal: '111111-33-33'
|
|
====
|
|
---- QUERY
|
|
# create table with DATE primary key partitioned by range
|
|
create table kudu_datepk_range (fdate DATE not null primary key)
|
|
partition by range (fdate)
|
|
(
|
|
partition values < DATE '1900-01-01',
|
|
partition DATE '1900-01-01' <= values < DATE '1970-01-01',
|
|
partition DATE '1970-01-01' <= values < DATE '2000-01-01',
|
|
partition DATE '2000-01-01' <= values
|
|
)
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Insert dates that land in three of the four declared range partitions;
# 1970-01-01 sits exactly on an inclusive lower bound.
insert into kudu_datepk_range values
|
|
(DATE '1800-01-01'),
|
|
(DATE '1970-01-01'),
|
|
(DATE '2019-12-12')
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 3
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
FDATE
|
|
---- DML_RESULTS: kudu_datepk_range
|
|
1800-01-01
|
|
1970-01-01
|
|
2019-12-12
|
|
---- TYPES
|
|
DATE
|
|
====
|
|
---- QUERY
|
|
# Read back the rows inserted into the range-partitioned DATE table.
select * from kudu_datepk_range;
|
|
---- RESULTS
|
|
1800-01-01
|
|
1970-01-01
|
|
2019-12-12
|
|
---- TYPES
|
|
DATE
|
|
====
|
|
---- QUERY
|
|
# Creates a Kudu table with varchar columns, primary key,
|
|
# hash partition and range partition.
|
|
create table create_varchar
|
|
(
|
|
valvc varchar(10),
|
|
primary key (valvc))
|
|
partition by hash (valvc) partitions 4, range (valvc) (
|
|
partition values < cast('m' as VARCHAR(10)),
|
|
partition cast('m' as VARCHAR(10)) <= values)
|
|
stored as kudu;
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Insert one value below, one equal to, and one above the 'm' range boundary.
insert into create_varchar values
|
|
(cast('a' as VARCHAR(10))),
|
|
(cast('m' as VARCHAR(10))),
|
|
(cast('z' as VARCHAR(10)))
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 3
|
|
NumRowErrors: 0
|
|
---- LABELS
|
|
VALVC
|
|
---- DML_RESULTS: create_varchar
|
|
'a'
|
|
'm'
|
|
'z'
|
|
---- TYPES
|
|
STRING
|
|
====
|
|
---- QUERY
|
|
# Create as select table with a varchar column and primary key
|
|
create table ctas_varchar primary key (vc)
|
|
stored as kudu
|
|
as select vc from functional.chars_tiny;
|
|
select * from ctas_varchar;
|
|
---- RESULTS
|
|
'1cccc'
|
|
'2cccccc'
|
|
'3ccc'
|
|
'4cc'
|
|
'5c'
|
|
'6c'
|
|
'c'
|
|
---- TYPES
|
|
STRING
|
|
====
|
|
---- QUERY
|
|
# Create with keyword 'stored by'
|
|
create table kudu_stored_by (i int primary key, s string, ts timestamp, d date) stored by kudu;
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Check that the table created with 'stored by kudu' reports the Kudu storage handler.
describe formatted kudu_stored_by;
|
|
---- RESULTS: VERIFY_IS_SUBSET
|
|
'','storage_handler ','org.apache.hadoop.hive.kudu.KuduStorageHandler'
|
|
---- TYPES
|
|
string, string, string
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table with non unique primary key
|
|
create table non_unique_key_create_tbl1 (id int non unique primary key, name string)
|
|
partition by hash (id) partitions 3
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Insert two rows into the table that has a non unique primary key.
insert into non_unique_key_create_tbl1 values (1,'Martin'), (2,'Smith');
|
|
---- RESULTS
|
|
: 2
|
|
---- RUNTIME_PROFILE
|
|
NumModifiedRows: 2
|
|
NumRowErrors: 0
|
|
====
|
|
---- QUERY
|
|
# auto-incrementing column is not shown for "select *"
|
|
select * from non_unique_key_create_tbl1 where name = 'Martin';
|
|
---- RESULTS
|
|
1,'Martin'
|
|
---- TYPES
|
|
INT,STRING
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table with non unique composite primary key
|
|
create table non_unique_key_create_tbl2 (a int, b string, non unique primary key(a, b))
|
|
partition by hash (a) partitions 3
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table with non unique composite primary key whose leading column is a string
|
|
create table non_unique_key_create_tbl3 (a string, b int, non unique primary key(a, b))
|
|
partition by hash (a) partitions 3
|
|
stored as kudu
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table without primary key columns,
|
|
# partition columns will be promoted as non unique primary key columns.
|
|
create table promote_partition_keys_as_non_unique_keys_test (a int, b string, c float)
|
|
partition by hash (a, b) partitions 3
|
|
stored as kudu;
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
---- ERRORS
|
|
Partition columns (a, b) are promoted as non unique primary key.
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table without primary key columns,
|
|
# partition columns cannot be promoted as non unique primary key columns since the columns
|
|
# are not beginning columns of the table.
|
|
create table partition_keys_not_promoted_test (a int, b string, c float)
|
|
partition by hash (b, c) partitions 3
|
|
stored as kudu;
|
|
---- CATCH
|
|
AnalysisException: Specify primary key or non unique primary key for the Kudu table, or create partitions with the beginning columns of the table.
|
|
====
|
|
---- QUERY
|
|
# Create unpartitioned Kudu table with non unique primary key column.
|
|
create table non_unique_key_create_tbl4 (a int non unique primary key, b string)
|
|
stored as kudu;
|
|
---- RESULTS
|
|
'Table has been created.'
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table in CTAS statement with non unique primary key
|
|
create table non_unique_key_create_tbl5 non unique primary key (id)
|
|
partition by hash (id) partitions 3
|
|
stored as kudu
|
|
as select id, int_col from functional.alltypestiny;
|
|
select * from non_unique_key_create_tbl5 order by id asc;
|
|
---- RESULTS
|
|
0,0
|
|
1,1
|
|
2,0
|
|
3,1
|
|
4,0
|
|
5,1
|
|
6,0
|
|
7,1
|
|
---- TYPES
|
|
INT,INT
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table in CTAS statement with non unique primary key and range partitions
|
|
create table non_unique_key_create_tbl6 non unique primary key (id)
|
|
partition by range (id) (partition values <= 1, partition 1 < values <= 3,
|
|
partition 3 < values <= 5, partition 5 < values)
|
|
stored as kudu
|
|
as select id, int_col from functional.alltypestiny order by id asc limit 100;
|
|
select id, int_col, auto_incrementing_id from non_unique_key_create_tbl6 order by id asc;
|
|
---- RESULTS
|
|
0,0,1
|
|
1,1,2
|
|
2,0,1
|
|
3,1,2
|
|
4,0,1
|
|
5,1,2
|
|
6,0,1
|
|
7,1,2
|
|
---- TYPES
|
|
INT,INT,BIGINT
|
|
====
|
|
---- QUERY
|
|
# Non unique primary key for non Kudu table
|
|
create table non_unique_key_create_tbl7 (x int, y boolean, non unique primary key(x, y))
|
|
---- CATCH
|
|
AnalysisException: NON UNIQUE PRIMARY KEY is only supported for Kudu
|
|
====
|
|
---- QUERY
|
|
# Non unique primary keys should be declared first
|
|
create table non_unique_key_create_tbl8 (x int, y int, non unique primary key(y))
|
|
partition by hash (y) partitions 3 stored as kudu
|
|
---- CATCH
|
|
ImpalaRuntimeException: Kudu NON UNIQUE PRIMARY KEY columns must be specified as the first columns in the table (expected leading columns ('y') but found ('x'))
|
|
====
|
|
---- QUERY
|
|
# Non unique primary keys should be listed in the same order
|
|
create table non_unique_key_create_tbl9 (x int, y int, z int, non unique primary key(y,x))
|
|
partition by hash (y) partitions 3 stored as kudu
|
|
---- CATCH
|
|
ImpalaRuntimeException: Kudu NON UNIQUE PRIMARY KEY columns must be specified as the first columns in the table (expected leading columns ('y', 'x') but found ('x', 'y'))
|
|
====
|
|
---- QUERY
|
|
# Non unique primary key cannot be boolean type
|
|
create table non_unique_key_create_tbl10 (x boolean non unique primary key)
|
|
partition by hash(x) partitions 8 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: key column may not have type of BOOL, FLOAT, or DOUBLE
|
|
====
|
|
---- QUERY
|
|
# Non unique primary key cannot be float type
|
|
create table non_unique_key_create_tbl11 (x float non unique primary key)
|
|
partition by hash(x) partitions 8 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: key column may not have type of BOOL, FLOAT, or DOUBLE
|
|
====
|
|
---- QUERY
|
|
# Non unique primary key cannot be double type
|
|
create table non_unique_key_create_tbl12 (x double non unique primary key)
|
|
partition by hash(x) partitions 8 stored as kudu
|
|
---- CATCH
|
|
NonRecoverableException: key column may not have type of BOOL, FLOAT, or DOUBLE
|
|
====
|
|
---- QUERY
|
|
# Cannot create a Kudu table without any key and partition
|
|
create table non_unique_key_create_tbl13 (x int) stored as kudu
|
|
---- CATCH
|
|
AnalysisException: A primary key is required for a Kudu table.
|
|
====
|
|
---- QUERY
|
|
# Cannot create a Kudu table with a column named as "auto_incrementing_id"
|
|
create table non_unique_key_create_tbl14 (id int primary key, auto_incrementing_id bigint)
|
|
partition by hash(id) partitions 3 stored as kudu
|
|
---- CATCH
|
|
IllegalArgumentException: Column name auto_incrementing_id is reserved by Kudu engine
|
|
====
|
|
---- QUERY
|
|
# Create Kudu table in CTAS statement without specifying primary key.
|
|
# Partition column 'id' is promoted as non unique primary key.
|
|
create table non_unique_key_create_tbl15
|
|
partition by range (id) (partition values <= 1, partition 1 < values <= 3,
|
|
partition 3 < values <= 5, partition 5 < values)
|
|
stored as kudu
|
|
as select id, int_col from functional.alltypestiny order by id asc limit 100;
|
|
select id, int_col, auto_incrementing_id from non_unique_key_create_tbl15 order by id asc;
|
|
---- RESULTS
|
|
0,0,1
|
|
1,1,2
|
|
2,0,1
|
|
3,1,2
|
|
4,0,1
|
|
5,1,2
|
|
6,0,1
|
|
7,1,2
|
|
---- TYPES
|
|
INT,INT,BIGINT
|
|
====
|