Files
impala/testdata/datasets/tpch/tpch_schema_template.sql
Lenni Kuff 1e25c98fb4 Test data loading framework improvements
This change includes a number of improvements for the test data loading framework:
* Named sections for schema template definitions
* Removal of unneeded sections from schema template definitions (e.g. ANALYZE TABLE)
* More granular data loading via table name filters
* Improved robustness in detecting failed data loads
* Table level constraints for specific file formats
* Re-written compute stats script
2014-01-08 10:46:49 -08:00

364 lines
9.3 KiB
SQL

# Copyright (c) 2012 Cloudera, Inc. All rights reserved.
# For details on this file format please see hive-benchmark_schema_template.sql
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.lineitem
---- CREATE
CREATE DATABASE IF NOT EXISTS tpch%(scale_factor)s;
CREATE EXTERNAL TABLE %(table_name)s (
  L_ORDERKEY INT,
  L_PARTKEY INT,
  L_SUPPKEY INT,
  L_LINENUMBER INT,
  L_QUANTITY DOUBLE,
  L_EXTENDEDPRICE DOUBLE,
  L_DISCOUNT DOUBLE,
  L_TAX DOUBLE,
  L_RETURNFLAG STRING,
  L_LINESTATUS STRING,
  L_SHIPDATE STRING,
  L_COMMITDATE STRING,
  L_RECEIPTDATE STRING,
  L_SHIPINSTRUCT STRING,
  L_SHIPMODE STRING,
  L_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/lineitem/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.part
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  P_PARTKEY INT,
  P_NAME STRING,
  P_MFGR STRING,
  P_BRAND STRING,
  P_TYPE STRING,
  P_SIZE INT,
  P_CONTAINER STRING,
  P_RETAILPRICE DOUBLE,
  P_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/part/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.partsupp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  PS_PARTKEY INT,
  PS_SUPPKEY INT,
  PS_AVAILQTY INT,
  PS_SUPPLYCOST DOUBLE,
  PS_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/partsupp/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.supplier
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  S_SUPPKEY INT,
  S_NAME STRING,
  S_ADDRESS STRING,
  S_NATIONKEY INT,
  S_PHONE STRING,
  S_ACCTBAL DOUBLE,
  S_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/supplier/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.nation
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  N_NATIONKEY INT,
  N_NAME STRING,
  N_REGIONKEY INT,
  N_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/nation/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.region
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  R_REGIONKEY INT,
  R_NAME STRING,
  R_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/region/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.orders
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  O_ORDERKEY INT,
  O_CUSTKEY INT,
  O_ORDERSTATUS STRING,
  O_TOTALPRICE DOUBLE,
  O_ORDERDATE STRING,
  O_ORDERPRIORITY STRING,
  O_CLERK STRING,
  O_SHIPPRIORITY INT,
  O_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/orders/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.customer
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  C_CUSTKEY INT,
  C_NAME STRING,
  C_ADDRESS STRING,
  C_NATIONKEY INT,
  C_PHONE STRING,
  C_ACCTBAL DOUBLE,
  C_MKTSEGMENT STRING,
  C_COMMENT STRING
)
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
---- DEPENDENT_LOAD
INSERT OVERWRITE TABLE %(table_name)s
SELECT *
FROM %(base_table_name)s;
---- LOAD
LOAD DATA LOCAL INPATH '${env:IMPALA_HOME}/testdata/impala-data/tpch%(scale_factor)s/customer/'
  OVERWRITE INTO TABLE %(table_name)s;
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q2_minimum_cost_supplier_tmp1
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  s_acctbal DOUBLE,
  s_name STRING,
  n_name STRING,
  p_partkey INT,
  ps_supplycost DOUBLE,
  p_mfgr STRING,
  s_address STRING,
  s_phone STRING,
  s_comment STRING
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q2_minimum_cost_supplier_tmp2
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  p_partkey INT,
  ps_min_supplycost DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q7_volume_shipping_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  supp_nation STRING,
  cust_nation STRING,
  s_nationkey INT,
  c_nationkey INT
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q11_part_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  ps_partkey INT,
  part_value DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q11_sum_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  total_value DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.revenue
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  supplier_no INT,
  total_revenue DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.max_revenue
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  max_revenue DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.supplier_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  s_suppkey INT
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q16_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  p_brand STRING,
  p_type STRING,
  p_size INT,
  ps_suppkey INT
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.lineitem_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  t_partkey INT,
  t_avg_quantity DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q18_tmp
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  l_orderkey INT,
  t_sum_quantity DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q20_tmp1
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  p_partkey INT
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q20_tmp2
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  l_partkey INT,
  l_suppkey INT,
  sum_quantity DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q20_tmp3
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  ps_suppkey INT,
  ps_availqty INT,
  sum_quantity DOUBLE
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q20_tmp4
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  ps_suppkey INT
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====
---- DATASET
tpch
---- BASE_TABLE_NAME
tpch%(scale_factor)s.q22_customer_tmp1
---- CREATE
CREATE EXTERNAL TABLE %(table_name)s (
  avg_acctbal DOUBLE,
  cust_name_char STRING
)
STORED AS %(file_format)s
LOCATION '${hiveconf:hive.metastore.warehouse.dir}/%(table_name)s';
====