mirror of
https://github.com/apache/impala.git
synced 2026-01-06 06:01:03 -05:00
For files that have a Cloudera copyright (and no other copyright notice), make changes to follow the ASF source file header policy here: http://www.apache.org/legal/src-headers.html#headers Specifically: 1) Remove the Cloudera copyright. 2) Modify NOTICE.txt according to http://www.apache.org/legal/src-headers.html#notice to follow that format and add a line for Cloudera. 3) Replace or add the existing ASF license text with the one given on the website. Much of this change was automatically generated via: git grep -li 'Copyright.*Cloudera' > modified_files.txt cat modified_files.txt | xargs perl -n -i -e 'print unless m#Copyright.*Cloudera#i;' cat modified_files_txt | xargs fix_apache_license.py [1] Some manual fixups were performed following those steps, especially when license text was completely missing from the file. [1] https://gist.github.com/anonymous/ff71292094362fc5c594 with minor modification to ORIG_LICENSE to match Impala's license text. Change-Id: I2e0bd8420945b953e1b806041bea4d72a3943d86 Reviewed-on: http://gerrit.cloudera.org:8080/3779 Reviewed-by: Dan Hecht <dhecht@cloudera.com> Tested-by: Internal Jenkins
364 lines
9.8 KiB
SQL
364 lines
9.8 KiB
SQL
# Licensed to the Apache Software Foundation (ASF) under one
|
|
# or more contributor license agreements. See the NOTICE file
|
|
# distributed with this work for additional information
|
|
# regarding copyright ownership. The ASF licenses this file
|
|
# to you under the Apache License, Version 2.0 (the
|
|
# "License"); you may not use this file except in compliance
|
|
# with the License. You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing,
|
|
# software distributed under the License is distributed on an
|
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
# KIND, either express or implied. See the License for the
|
|
# specific language governing permissions and limitations
|
|
# under the License.
|
|
#
|
|
# For details on this file format please see hive-benchmark_schema_template.sql
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
lineitem
|
|
---- COLUMNS
|
|
L_ORDERKEY BIGINT
|
|
L_PARTKEY BIGINT
|
|
L_SUPPKEY BIGINT
|
|
L_LINENUMBER INT
|
|
L_QUANTITY DECIMAL(12,2)
|
|
L_EXTENDEDPRICE DECIMAL(12,2)
|
|
L_DISCOUNT DECIMAL(12,2)
|
|
L_TAX DECIMAL(12,2)
|
|
L_RETURNFLAG STRING
|
|
L_LINESTATUS STRING
|
|
L_SHIPDATE STRING
|
|
L_COMMITDATE STRING
|
|
L_RECEIPTDATE STRING
|
|
L_SHIPINSTRUCT STRING
|
|
L_SHIPMODE STRING
|
|
L_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
L_ORDERKEY BIGINT,
|
|
L_PARTKEY BIGINT,
|
|
L_SUPPKEY BIGINT,
|
|
L_LINENUMBER INT,
|
|
L_QUANTITY DOUBLE,
|
|
L_EXTENDEDPRICE DOUBLE,
|
|
L_DISCOUNT DOUBLE,
|
|
L_TAX DOUBLE,
|
|
L_RETURNFLAG STRING,
|
|
L_LINESTATUS STRING,
|
|
L_SHIPDATE STRING,
|
|
L_COMMITDATE STRING,
|
|
L_RECEIPTDATE STRING,
|
|
L_SHIPINSTRUCT STRING,
|
|
L_SHIPMODE STRING,
|
|
L_COMMENT STRING
|
|
)
|
|
distribute by hash (l_orderkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'l_orderkey, l_partkey, l_suppkey, l_linenumber'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
part
|
|
---- COLUMNS
|
|
P_PARTKEY BIGINT
|
|
P_NAME STRING
|
|
P_MFGR STRING
|
|
P_BRAND STRING
|
|
P_TYPE STRING
|
|
P_SIZE INT
|
|
P_CONTAINER STRING
|
|
P_RETAILPRICE DECIMAL(12,2)
|
|
P_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
P_PARTKEY BIGINT,
|
|
P_NAME STRING,
|
|
P_MFGR STRING,
|
|
P_BRAND STRING,
|
|
P_TYPE STRING,
|
|
P_SIZE INT,
|
|
P_CONTAINER STRING,
|
|
P_RETAILPRICE DOUBLE,
|
|
P_COMMENT STRING
|
|
)
|
|
distribute by hash (p_partkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'p_partkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
partsupp
|
|
---- COLUMNS
|
|
PS_PARTKEY BIGINT
|
|
PS_SUPPKEY BIGINT
|
|
PS_AVAILQTY INT
|
|
PS_SUPPLYCOST DECIMAL(12,2)
|
|
PS_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
PS_PARTKEY BIGINT,
|
|
PS_SUPPKEY BIGINT,
|
|
PS_AVAILQTY BIGINT,
|
|
PS_SUPPLYCOST DOUBLE,
|
|
PS_COMMENT STRING
|
|
)
|
|
distribute by hash (ps_partkey, ps_suppkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'ps_partkey, ps_suppkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
supplier
|
|
---- COLUMNS
|
|
S_SUPPKEY BIGINT
|
|
S_NAME STRING
|
|
S_ADDRESS STRING
|
|
S_NATIONKEY SMALLINT
|
|
S_PHONE STRING
|
|
S_ACCTBAL DECIMAL(12,2)
|
|
S_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
S_SUPPKEY BIGINT,
|
|
S_NAME STRING,
|
|
S_ADDRESS STRING,
|
|
S_NATIONKEY SMALLINT,
|
|
S_PHONE STRING,
|
|
S_ACCTBAL DOUBLE,
|
|
S_COMMENT STRING
|
|
)
|
|
distribute by hash (s_suppkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 's_suppkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
nation
|
|
---- COLUMNS
|
|
N_NATIONKEY SMALLINT
|
|
N_NAME STRING
|
|
N_REGIONKEY SMALLINT
|
|
N_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
N_NATIONKEY SMALLINT,
|
|
N_NAME STRING,
|
|
N_REGIONKEY SMALLINT,
|
|
N_COMMENT STRING
|
|
)
|
|
distribute by hash (n_nationkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'n_nationkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
region
|
|
---- COLUMNS
|
|
R_REGIONKEY SMALLINT
|
|
R_NAME STRING
|
|
R_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
R_REGIONKEY SMALLINT,
|
|
R_NAME STRING,
|
|
R_COMMENT STRING
|
|
)
|
|
distribute by hash (r_regionkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'r_regionkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
orders
|
|
---- COLUMNS
|
|
O_ORDERKEY BIGINT
|
|
O_CUSTKEY BIGINT
|
|
O_ORDERSTATUS STRING
|
|
O_TOTALPRICE DECIMAL(12,2)
|
|
O_ORDERDATE STRING
|
|
O_ORDERPRIORITY STRING
|
|
O_CLERK STRING
|
|
O_SHIPPRIORITY INT
|
|
O_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
O_ORDERKEY BIGINT,
|
|
O_CUSTKEY BIGINT,
|
|
O_ORDERSTATUS STRING,
|
|
O_TOTALPRICE DOUBLE,
|
|
O_ORDERDATE STRING,
|
|
O_ORDERPRIORITY STRING,
|
|
O_CLERK STRING,
|
|
O_SHIPPRIORITY INT,
|
|
O_COMMENT STRING
|
|
)
|
|
distribute by hash (o_orderkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'o_orderkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
customer
|
|
---- COLUMNS
|
|
C_CUSTKEY BIGINT
|
|
C_NAME STRING
|
|
C_ADDRESS STRING
|
|
C_NATIONKEY SMALLINT
|
|
C_PHONE STRING
|
|
C_ACCTBAL DECIMAL(12,2)
|
|
C_MKTSEGMENT STRING
|
|
C_COMMENT STRING
|
|
---- ROW_FORMAT
|
|
DELIMITED FIELDS TERMINATED BY '|'
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
C_CUSTKEY BIGINT,
|
|
C_NAME STRING,
|
|
C_ADDRESS STRING,
|
|
C_NATIONKEY SMALLINT,
|
|
C_PHONE STRING,
|
|
C_ACCTBAL DOUBLE,
|
|
C_MKTSEGMENT STRING,
|
|
C_COMMENT STRING
|
|
)
|
|
distribute by hash (c_custkey) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'c_custkey'
|
|
);
|
|
---- DEPENDENT_LOAD
|
|
INSERT OVERWRITE TABLE {db_name}{db_suffix}.{table_name} SELECT * FROM {db_name}.{table_name};
|
|
---- LOAD
|
|
LOAD DATA LOCAL INPATH '{impala_home}/testdata/impala-data/{db_name}/{table_name}'
|
|
OVERWRITE INTO TABLE {db_name}{db_suffix}.{table_name};
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
revenue
|
|
---- COLUMNS
|
|
supplier_no bigint
|
|
total_revenue Decimal(38,4)
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
supplier_no bigint,
|
|
total_revevue double
|
|
)
|
|
distribute by hash (supplier_no) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'supplier_no'
|
|
);
|
|
====
|
|
---- DATASET
|
|
tpch
|
|
---- BASE_TABLE_NAME
|
|
max_revenue
|
|
---- COLUMNS
|
|
max_revenue Decimal(38, 4)
|
|
---- CREATE_KUDU
|
|
create table if not exists {db_name}{db_suffix}.{table_name} (
|
|
max_revenue bigint
|
|
)
|
|
distribute by hash (max_revenue) into 9 buckets
|
|
tblproperties(
|
|
'storage_handler' = 'com.cloudera.kudu.hive.KuduStorageHandler',
|
|
'kudu.master_addresses' = '127.0.0.1:7051',
|
|
'kudu.table_name' = '{table_name}',
|
|
'kudu.key_columns' = 'max_revenue'
|
|
);
|
|
====
|