mirror of
https://github.com/apache/impala.git
synced 2025-12-19 09:58:28 -05:00
IMPALA-13617: Rename c_last_review_date to c_last_review_date_sk
TPC-DS v2.11.0, section 2.4.7, renames column customer.c_last_review_date
to customer.c_last_review_date_sk to align with other surrogate key
columns. impala-tpcds-kit has been modified to reflect this column name
change in
086d7113c8
However, the tpcds dataset schema in the Impala test data was left unchanged.
This patch applies the same rename there to align more closely with TPC-DS
v2.11.0. It does not adjust the column's data type because that adjustment
requires larger changes.
customer_multiblock_page_index.parquet added by IMPALA-10310 is
regenerated to follow the new schema of table customer. The SQL used to
create the file now orders rows by both the
c_current_cdemo_sk and c_customer_sk columns. The associated test
assertion in parquet-page-index.test is also updated.
A workaround in test_file_parser.py added by IMPALA-13543 is now removed
after this change is applied.
Testing:
- Pass core tests.
Change-Id: Ie446b3c534cb8f6f54265cd9b2f705cad91dd4ac
Reviewed-on: http://gerrit.cloudera.org:8080/22223
Reviewed-by: Impala Public Jenkins <impala-public-jenkins@cloudera.com>
Tested-by: Impala Public Jenkins <impala-public-jenkins@cloudera.com>
This commit is contained in:
committed by
Impala Public Jenkins
parent
f8f2020391
commit
2f5aef64a5
@@ -462,7 +462,7 @@ CREATE TABLE tpcds_kudu.customer (
|
||||
c_birth_country STRING,
|
||||
c_login STRING,
|
||||
c_email_address STRING,
|
||||
c_last_review_date STRING
|
||||
c_last_review_date_sk STRING
|
||||
)
|
||||
PARTITION BY HASH (c_customer_sk) PARTITIONS 12
|
||||
STORED AS KUDU;
|
||||
|
||||
@@ -188,7 +188,7 @@ CREATE EXTERNAL TABLE tpcds_raw.customer (
|
||||
c_birth_country STRING,
|
||||
c_login STRING,
|
||||
c_email_address STRING,
|
||||
c_last_review_date STRING
|
||||
c_last_review_date_sk STRING
|
||||
)
|
||||
ROW FORMAT DELIMITED FIELDS TERMINATED BY '|'
|
||||
WITH SERDEPROPERTIES ('field.delim'='|', 'serialization.format'='|')
|
||||
@@ -808,7 +808,7 @@ CREATE TABLE tpcds_parquet.customer (
|
||||
c_birth_country STRING,
|
||||
c_login STRING,
|
||||
c_email_address STRING,
|
||||
c_last_review_date STRING
|
||||
c_last_review_date_sk STRING
|
||||
)
|
||||
STORED AS PARQUET;
|
||||
CREATE TABLE tpcds_parquet.customer_address (
|
||||
|
||||
@@ -1121,7 +1121,7 @@ show table stats store_sales;
|
||||
| c_birth_country | STRING | -1 | -1 | -1 | -1 |
|
||||
| c_login | STRING | -1 | -1 | -1 | -1 |
|
||||
| c_email_address | STRING | -1 | -1 | -1 | -1 |
|
||||
| c_last_review_date | STRING | -1 | -1 | -1 | -1 |
|
||||
| c_last_review_date_sk | STRING | -1 | -1 | -1 | -1 |
|
||||
+------------------------+--------+------------------+--------+----------+----------+
|
||||
|
||||
show column stats store_sales;
|
||||
@@ -1196,7 +1196,7 @@ show column stats customer;
|
||||
| c_birth_country | STRING | 205 | -1 | 20 | 8.4001 |
|
||||
| c_login | STRING | 1 | -1 | 0 | 0 |
|
||||
| c_email_address | STRING | 94492 | -1 | 46 | 26.485 |
|
||||
| c_last_review_date | STRING | 349 | -1 | 7 | 6.7561 |
|
||||
| c_last_review_date_sk | STRING | 349 | -1 | 7 | 6.7561 |
|
||||
+------------------------+--------+------------------+--------+----------+--------+
|
||||
|
||||
show column stats store_sales;
|
||||
|
||||
@@ -250,7 +250,7 @@ Welcome to the Impala shell. Press TAB twice to see a list of available commands
|
||||
| c_birth_country | string | |
|
||||
| c_login | string | |
|
||||
| c_email_address | string | |
|
||||
| c_last_review_date | string | |
|
||||
| c_last_review_date_sk | string | |
|
||||
+------------------------+--------+---------+
|
||||
[localhost:21000] > select count(*) from customer;
|
||||
+----------+
|
||||
@@ -724,7 +724,7 @@ create external table customer
|
||||
c_birth_country string,
|
||||
c_login string,
|
||||
c_email_address string,
|
||||
c_last_review_date string
|
||||
c_last_review_date_sk string
|
||||
)
|
||||
row format delimited fields terminated by '|'
|
||||
location '/user/hive/tpcds/customer';
|
||||
|
||||
16
testdata/data/README
vendored
16
testdata/data/README
vendored
@@ -620,17 +620,17 @@ if (r ... ) location.offset = -1;
|
||||
|
||||
customer_multiblock_page_index.parquet
|
||||
Parquet file that contains multiple blocks in a single file. Needed to test IMPALA-10310.
|
||||
In order to generate this file, execute the following instruments:
|
||||
// use 1.11.0 to generate page index
|
||||
1. export HIVE_AUX_JARS_PATH=/path/parquet-hadoop-1.11.0.jar
|
||||
// in hive shell
|
||||
2. SET parquet.block.size=8192; // use little block size
|
||||
3. SET parquet.page.row.count.limit=10; // little page row count generate multi pages
|
||||
4. CREATE TABLE customer_multiblock_page_index_6
|
||||
In order to generate this file, execute the following instructions in beeline
|
||||
(Beeline version 3.1.3000.7.3.1.0-160 by Apache Hive):
|
||||
1. SET parquet.block.size=8192; // use little block size
|
||||
2. SET parquet.page.row.count.limit=10; // little page row count generate multi pages
|
||||
3. CREATE TABLE customer_multiblock_page_index_6
|
||||
STORED AS PARQUET
|
||||
TBLPROPERTIES('parquet.compression'='SNAPPY')
|
||||
AS SELECT * FROM tpcds.customer
|
||||
WHERE c_current_cdemo_sk IS NOT NULL ORDER BY c_current_cdemo_sk LIMIT 2000;
|
||||
WHERE c_current_cdemo_sk IS NOT NULL
|
||||
ORDER BY c_current_cdemo_sk, c_customer_sk
|
||||
LIMIT 2000;
|
||||
The generated file will contain multiple blocks, with multiple pages per block.
|
||||
|
||||
customer_nested_multiblock_multipage.parquet
|
||||
|
||||
BIN
testdata/data/customer_multiblock_page_index.parquet
vendored
BIN
testdata/data/customer_multiblock_page_index.parquet
vendored
Binary file not shown.
@@ -308,7 +308,7 @@ CREATE EXTERNAL TABLE IF NOT EXISTS {jdbc_db_name}.customer (
|
||||
c_birth_country STRING,
|
||||
c_login STRING,
|
||||
c_email_address STRING,
|
||||
c_last_review_date STRING
|
||||
c_last_review_date_sk STRING
|
||||
)
|
||||
STORED AS JDBC
|
||||
TBLPROPERTIES (
|
||||
|
||||
@@ -451,7 +451,7 @@ CREATE TABLE {target_db_name}.customer (
|
||||
c_birth_country STRING,
|
||||
c_login STRING,
|
||||
c_email_address STRING,
|
||||
c_last_review_date STRING
|
||||
c_last_review_date_sk STRING
|
||||
)
|
||||
PARTITION BY HASH (c_customer_sk) PARTITIONS {buckets}
|
||||
STORED AS KUDU
|
||||
|
||||
@@ -376,7 +376,7 @@ c_birth_year int
|
||||
c_birth_country string
|
||||
c_login string
|
||||
c_email_address string
|
||||
c_last_review_date string
|
||||
c_last_review_date_sk string
|
||||
primary key (c_customer_sk) DISABLE NOVALIDATE RELY
|
||||
foreign key (c_current_addr_sk) references {db_name}{db_suffix}.customer_address (ca_address_sk) DISABLE NOVALIDATE RELY
|
||||
foreign key (c_current_cdemo_sk) references {db_name}{db_suffix}.customer_demographics (cd_demo_sk) DISABLE NOVALIDATE RELY
|
||||
|
||||
@@ -391,7 +391,7 @@ SELECT
|
||||
c_birth_country,
|
||||
c_login,
|
||||
c_email_address,
|
||||
CAST(c_last_review_date AS INT)
|
||||
CAST(c_last_review_date_sk AS INT)
|
||||
FROM tpcds{scale_factor}.{table_name};
|
||||
====
|
||||
---- DATASET
|
||||
|
||||
@@ -7,7 +7,7 @@ where c_salutation = 'Mrs.'
|
||||
F00:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=181.75MB mem-reservation=21.75MB thread-reservation=3 runtime-filters-memory=1.00MB
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date_sk
|
||||
| mem-estimate=100.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
02:HASH JOIN [INNER JOIN]
|
||||
@@ -51,7 +51,7 @@ where c_salutation = 'Mrs.'
|
||||
F00:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=180.75MB mem-reservation=20.75MB thread-reservation=3
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date_sk
|
||||
| mem-estimate=100.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
02:HASH JOIN [LEFT OUTER JOIN]
|
||||
@@ -94,7 +94,7 @@ where c_salutation = 'Mrs.'
|
||||
F00:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=181.75MB mem-reservation=21.75MB thread-reservation=3 runtime-filters-memory=1.00MB
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date_sk
|
||||
| mem-estimate=100.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
02:HASH JOIN [RIGHT OUTER JOIN]
|
||||
@@ -364,7 +364,7 @@ on ss_customer_sk % 10 = c_customer_sk / 100
|
||||
F00:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=211.00MB mem-reservation=51.00MB thread-reservation=3 runtime-filters-memory=1.00MB
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date
|
||||
| output exprs: tpcds.store_sales.ss_sold_time_sk, tpcds.store_sales.ss_item_sk, tpcds.store_sales.ss_customer_sk, tpcds.store_sales.ss_cdemo_sk, tpcds.store_sales.ss_hdemo_sk, tpcds.store_sales.ss_addr_sk, tpcds.store_sales.ss_store_sk, tpcds.store_sales.ss_promo_sk, tpcds.store_sales.ss_ticket_number, tpcds.store_sales.ss_quantity, tpcds.store_sales.ss_wholesale_cost, tpcds.store_sales.ss_list_price, tpcds.store_sales.ss_sales_price, tpcds.store_sales.ss_ext_discount_amt, tpcds.store_sales.ss_ext_sales_price, tpcds.store_sales.ss_ext_wholesale_cost, tpcds.store_sales.ss_ext_list_price, tpcds.store_sales.ss_ext_tax, tpcds.store_sales.ss_coupon_amt, tpcds.store_sales.ss_net_paid, tpcds.store_sales.ss_net_paid_inc_tax, tpcds.store_sales.ss_net_profit, tpcds.store_sales.ss_sold_date_sk, tpcds.customer.c_customer_sk, tpcds.customer.c_customer_id, tpcds.customer.c_current_cdemo_sk, tpcds.customer.c_current_hdemo_sk, tpcds.customer.c_current_addr_sk, tpcds.customer.c_first_shipto_date_sk, tpcds.customer.c_first_sales_date_sk, tpcds.customer.c_salutation, tpcds.customer.c_first_name, tpcds.customer.c_last_name, tpcds.customer.c_preferred_cust_flag, tpcds.customer.c_birth_day, tpcds.customer.c_birth_month, tpcds.customer.c_birth_year, tpcds.customer.c_birth_country, tpcds.customer.c_login, tpcds.customer.c_email_address, tpcds.customer.c_last_review_date_sk
|
||||
| mem-estimate=100.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
02:HASH JOIN [INNER JOIN]
|
||||
|
||||
@@ -22,7 +22,7 @@ SELECT c_customer_id,
|
||||
c_birth_country,
|
||||
c_login,
|
||||
c_email_address,
|
||||
c_last_review_date,
|
||||
c_last_review_date_sk,
|
||||
ctr_total_return
|
||||
FROM customer_total_return ctr1,
|
||||
customer_address,
|
||||
@@ -45,7 +45,7 @@ ORDER BY c_customer_id,
|
||||
c_birth_country,
|
||||
c_login,
|
||||
c_email_address,
|
||||
c_last_review_date,
|
||||
c_last_review_date_sk,
|
||||
ctr_total_return
|
||||
LIMIT 100;
|
||||
---- PLAN
|
||||
@@ -54,11 +54,11 @@ Per-Host Resource Estimates: Memory=429MB
|
||||
F00:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=428.81MB mem-reservation=27.44MB thread-reservation=9 runtime-filters-memory=7.00MB
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date, ctr_total_return
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date_sk, ctr_total_return
|
||||
| mem-estimate=4.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
18:TOP-N [LIMIT=100]
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date ASC, ctr_total_return ASC
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date_sk ASC, ctr_total_return ASC
|
||||
| mem-estimate=20.64KB mem-reservation=0B thread-reservation=0
|
||||
| tuple-ids=15 row-size=211B cardinality=100
|
||||
| in pipelines: 18(GETNEXT), 07(OPEN)
|
||||
@@ -239,11 +239,11 @@ Per-Host Resource Estimates: Memory=504MB
|
||||
F11:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Host Resources: mem-estimate=4.04MB mem-reservation=4.00MB thread-reservation=1
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date, ctr_total_return
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date_sk, ctr_total_return
|
||||
| mem-estimate=4.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
32:MERGING-EXCHANGE [UNPARTITIONED]
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date ASC, ctr_total_return ASC
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date_sk ASC, ctr_total_return ASC
|
||||
| limit: 100
|
||||
| mem-estimate=41.67KB mem-reservation=0B thread-reservation=0
|
||||
| tuple-ids=15 row-size=211B cardinality=100
|
||||
@@ -252,7 +252,7 @@ PLAN-ROOT SINK
|
||||
F00:PLAN FRAGMENT [RANDOM] hosts=1 instances=1
|
||||
Per-Host Resources: mem-estimate=137.32MB mem-reservation=16.81MB thread-reservation=2 runtime-filters-memory=3.00MB
|
||||
18:TOP-N [LIMIT=100]
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date ASC, ctr_total_return ASC
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date_sk ASC, ctr_total_return ASC
|
||||
| mem-estimate=20.64KB mem-reservation=0B thread-reservation=0
|
||||
| tuple-ids=15 row-size=211B cardinality=100
|
||||
| in pipelines: 18(GETNEXT), 07(OPEN)
|
||||
@@ -524,11 +524,11 @@ Per-Host Resource Estimates: Memory=236MB
|
||||
F11:PLAN FRAGMENT [UNPARTITIONED] hosts=1 instances=1
|
||||
| Per-Instance Resources: mem-estimate=4.04MB mem-reservation=4.00MB thread-reservation=1
|
||||
PLAN-ROOT SINK
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date, ctr_total_return
|
||||
| output exprs: c_customer_id, c_salutation, c_first_name, c_last_name, c_preferred_cust_flag, c_birth_day, c_birth_month, c_birth_year, c_birth_country, c_login, c_email_address, c_last_review_date_sk, ctr_total_return
|
||||
| mem-estimate=4.00MB mem-reservation=4.00MB spill-buffer=2.00MB thread-reservation=0
|
||||
|
|
||||
32:MERGING-EXCHANGE [UNPARTITIONED]
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date ASC, ctr_total_return ASC
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date_sk ASC, ctr_total_return ASC
|
||||
| limit: 100
|
||||
| mem-estimate=41.67KB mem-reservation=0B thread-reservation=0
|
||||
| tuple-ids=15 row-size=211B cardinality=100
|
||||
@@ -538,7 +538,7 @@ F00:PLAN FRAGMENT [RANDOM] hosts=1 instances=1
|
||||
Per-Host Shared Resources: mem-estimate=2.00MB mem-reservation=2.00MB thread-reservation=0 runtime-filters-memory=2.00MB
|
||||
Per-Instance Resources: mem-estimate=16.02MB mem-reservation=8.00MB thread-reservation=1
|
||||
18:TOP-N [LIMIT=100]
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date ASC, ctr_total_return ASC
|
||||
| order by: c_customer_id ASC, c_salutation ASC, c_first_name ASC, c_last_name ASC, c_preferred_cust_flag ASC, c_birth_day ASC, c_birth_month ASC, c_birth_year ASC, c_birth_country ASC, c_login ASC, c_email_address ASC, c_last_review_date_sk ASC, ctr_total_return ASC
|
||||
| mem-estimate=20.64KB mem-reservation=0B thread-reservation=0
|
||||
| tuple-ids=15 row-size=211B cardinality=100
|
||||
| in pipelines: 18(GETNEXT), 07(OPEN)
|
||||
|
||||
@@ -371,8 +371,11 @@ where c_current_cdemo_sk < 100 group by c_birth_country;
|
||||
---- TYPES
|
||||
STRING, BIGINT
|
||||
---- RUNTIME_PROFILE
|
||||
aggregation(SUM, NumPages): 30
|
||||
aggregation(SUM, NumStatsFilteredPages): 27
|
||||
aggregation(SUM, NumPages): 6
|
||||
aggregation(SUM, NumRowGroups): 20
|
||||
aggregation(SUM, NumRowGroupsWithPageIndex): 20
|
||||
aggregation(SUM, NumStatsFilteredPages): 3
|
||||
aggregation(SUM, NumStatsFilteredRowGroups): 19
|
||||
====
|
||||
---- QUERY
|
||||
# IMPALA-10345: Impala hits DCHECK in parquet-column-stats.inline.h
|
||||
|
||||
@@ -15,7 +15,7 @@ with customer_total_return as
|
||||
,ca_state)
|
||||
select c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
from customer_total_return ctr1
|
||||
,customer_address
|
||||
,customer
|
||||
@@ -27,7 +27,7 @@ with customer_total_return as
|
||||
and ctr1.ctr_customer_sk = c_customer_sk
|
||||
order by c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
limit 100;
|
||||
|
||||
|
||||
|
||||
@@ -13,7 +13,7 @@ with customer_total_return as
|
||||
,ca_state)
|
||||
select c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
from customer_total_return ctr1
|
||||
,customer_address
|
||||
,customer
|
||||
@@ -25,7 +25,7 @@ with customer_total_return as
|
||||
and ctr1.ctr_customer_sk = c_customer_sk
|
||||
order by c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
limit 100;
|
||||
|
||||
-- end query 1 in stream 0 using template query30.tpl
|
||||
|
||||
@@ -14,7 +14,7 @@ with customer_total_return as
|
||||
,ca_state)
|
||||
select c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
from customer_total_return ctr1
|
||||
,customer_address
|
||||
,customer
|
||||
@@ -26,7 +26,7 @@ with customer_total_return as
|
||||
and ctr1.ctr_customer_sk = c_customer_sk
|
||||
order by c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
limit 100;
|
||||
---- RESULTS
|
||||
'AAAAAAAAACBFAAAA','Dr.','Clifton','Carr','N',4,4,1950,'INDIA','NULL','Clifton.Carr@mOm0RG.com','2452385',2232.42
|
||||
|
||||
@@ -14,7 +14,7 @@ with customer_total_return as
|
||||
,ca_state)
|
||||
select c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
from customer_total_return ctr1
|
||||
,customer_address
|
||||
,customer
|
||||
@@ -26,7 +26,7 @@ with customer_total_return as
|
||||
and ctr1.ctr_customer_sk = c_customer_sk
|
||||
order by c_customer_id,c_salutation,c_first_name,c_last_name,c_preferred_cust_flag
|
||||
,c_birth_day,c_birth_month,c_birth_year,c_birth_country,c_login,c_email_address
|
||||
,c_last_review_date,ctr_total_return
|
||||
,c_last_review_date_sk,ctr_total_return
|
||||
limit 100;
|
||||
---- RESULTS
|
||||
'AAAAAAAAACBFAAAA','Dr.','Clifton','Carr','N',4,4,1950,'INDIA','NULL','Clifton.Carr@mOm0RG.com','2452385',2232.42
|
||||
|
||||
@@ -433,9 +433,6 @@ def load_tpc_queries(workload, include_stress_queries=False, query_name_filters=
|
||||
test_cases = parse_query_test_file(file_path)
|
||||
for test_case in test_cases:
|
||||
query_sql = remove_comments(test_case["QUERY"])
|
||||
if workload == "tpcds_partitioned":
|
||||
# replace old columns names from old TPC-DS spec with a new one.
|
||||
query_sql = query_sql.replace("c_last_review_date", "c_last_review_date_sk")
|
||||
|
||||
if re.match(filter_regex, test_case["QUERY_NAME"]):
|
||||
query_name_match = query_name_pattern.search(test_case["QUERY_NAME"])
|
||||
|
||||
Reference in New Issue
Block a user