Add the list of tables missing stats to the explain header and to the mem-limit exceeded error.

Change-Id: Ibe8f329d5513ae84a8134b9ddb3645fa174d8a66
Reviewed-on: http://gerrit.ent.cloudera.com:8080/1501
Reviewed-by: Alex Behm <alex.behm@cloudera.com>
Tested-by: jenkins
Reviewed-on: http://gerrit.ent.cloudera.com:8080/1880
This commit is contained in:
Alex Behm
2014-02-07 19:55:08 -08:00
committed by jenkins
parent b1aeea3f0b
commit 7fcd7cd64e
15 changed files with 323 additions and 29 deletions

View File

@@ -109,4 +109,27 @@ where month = 2
''
'WRITE TO HDFS [functional.t, OVERWRITE=false]'
'00:SCAN HDFS [functional.alltypes]'
====
---- QUERY
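# Tests that the explain header warns about tables missing table and/or column stats.
# functional_avro.alltypes is scanned twice (t1 and t3) but must be listed only once.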
explain select count(t1.int_col), avg(t2.float_col), sum(t3.bigint_col)
from functional_avro.alltypes t1
inner join functional_parquet.alltypessmall t2 on (t1.id = t2.id)
left outer join functional_avro.alltypes t3 on (t2.id = t3.id)
where t1.month = 1 and t2.year = 2009 and t3.bool_col = false
---- RESULTS
'Estimated Per-Host Requirements: Memory=4.03GB VCores=3'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'functional_avro.alltypes, functional_parquet.alltypessmall'
''
'09:AGGREGATE [MERGE FINALIZE]'
'08:EXCHANGE [PARTITION=UNPARTITIONED]'
'05:AGGREGATE'
'04:HASH JOIN [LEFT OUTER JOIN, BROADCAST]'
'|--07:EXCHANGE [BROADCAST]'
'| 02:SCAN HDFS [functional_avro.alltypes t3]'
'03:HASH JOIN [INNER JOIN, BROADCAST]'
'|--06:EXCHANGE [BROADCAST]'
'| 01:SCAN HDFS [functional_parquet.alltypessmall t2]'
'00:SCAN HDFS [functional_avro.alltypes t1]'
====

View File

@@ -174,4 +174,45 @@ where month = 2
'|'
'00:SCAN HDFS [functional.alltypes]'
' partitions=2/24 size=36.51KB'
====
---- QUERY
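# Tests that the explain header warns about tables missing table and/or column stats.
# functional_avro.alltypes is scanned twice (t1 and t3) but must be listed only once.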
explain select count(t1.int_col), avg(t2.float_col), sum(t3.bigint_col)
from functional_avro.alltypes t1
inner join functional_parquet.alltypessmall t2 on (t1.id = t2.id)
left outer join functional_avro.alltypes t3 on (t2.id = t3.id)
where t1.month = 1 and t2.year = 2009 and t3.bool_col = false
---- RESULTS
'Estimated Per-Host Requirements: Memory=4.03GB VCores=3'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'functional_avro.alltypes, functional_parquet.alltypessmall'
''
'09:AGGREGATE [MERGE FINALIZE]'
'| output: sum(count(t1.int_col)), sum(sum(t2.float_col)), sum(count(t2.float_col)), sum(sum(t3.bigint_col))'
'|'
'08:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
'05:AGGREGATE'
'| output: count(t1.int_col), sum(t2.float_col), count(t2.float_col), sum(t3.bigint_col)'
'|'
'04:HASH JOIN [LEFT OUTER JOIN, BROADCAST]'
'| hash predicates: t2.id = t3.id'
'| other predicates: t3.bool_col = FALSE'
'|'
'|--07:EXCHANGE [BROADCAST]'
'| |'
'| 02:SCAN HDFS [functional_avro.alltypes t3]'
'| partitions=24/24 size=470.35KB'
'| predicates: t3.bool_col = FALSE'
'|'
'03:HASH JOIN [INNER JOIN, BROADCAST]'
'| hash predicates: t1.id = t2.id'
'|'
'|--06:EXCHANGE [BROADCAST]'
'| |'
'| 01:SCAN HDFS [functional_parquet.alltypessmall t2]'
'| partitions=4/4 size=9.63KB'
'|'
'00:SCAN HDFS [functional_avro.alltypes t1]'
' partitions=2/24 size=39.87KB'
====

View File

@@ -280,3 +280,70 @@ where month = 2
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=1 row-size=97B cardinality=560'
====
---- QUERY
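# Tests that the explain header warns about tables missing table and/or column stats.
# functional_avro.alltypes is scanned twice (t1 and t3) but must be listed only once.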
explain select count(t1.int_col), avg(t2.float_col), sum(t3.bigint_col)
from functional_avro.alltypes t1
inner join functional_parquet.alltypessmall t2 on (t1.id = t2.id)
left outer join functional_avro.alltypes t3 on (t2.id = t3.id)
where t1.month = 1 and t2.year = 2009 and t3.bool_col = false
---- RESULTS
'Estimated Per-Host Requirements: Memory=4.03GB VCores=3'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'functional_avro.alltypes, functional_parquet.alltypessmall'
''
'09:AGGREGATE [MERGE FINALIZE]'
'| output: sum(count(t1.int_col)), sum(sum(t2.float_col)), sum(count(t2.float_col)), sum(sum(t3.bigint_col))'
'| hosts=3 per-host-mem=unavailable'
'| tuple-ids=3 row-size=32B cardinality=1'
'|'
'08:EXCHANGE [PARTITION=UNPARTITIONED]'
'| hosts=3 per-host-mem=unavailable'
'| tuple-ids=3 row-size=32B cardinality=1'
'|'
'05:AGGREGATE'
'| output: count(t1.int_col), sum(t2.float_col), count(t2.float_col), sum(t3.bigint_col)'
'| hosts=3 per-host-mem=10.00MB'
'| tuple-ids=3 row-size=32B cardinality=1'
'|'
'04:HASH JOIN [LEFT OUTER JOIN, BROADCAST]'
'| hash predicates: t2.id = t3.id'
'| other predicates: t3.bool_col = FALSE'
'| hosts=3 per-host-mem=2.00GB'
'| tuple-ids=0,1,2N row-size=37B cardinality=unavailable'
'|'
'|--07:EXCHANGE [BROADCAST]'
'| | hosts=3 per-host-mem=0B'
'| | tuple-ids=2 row-size=13B cardinality=unavailable'
'| |'
'| 02:SCAN HDFS [functional_avro.alltypes t3, PARTITION=RANDOM]'
'| partitions=24/24 size=470.35KB'
'| predicates: t3.bool_col = FALSE'
'| table stats: unavailable'
'| column stats: unavailable'
'| hosts=3 per-host-mem=16.00MB'
'| tuple-ids=2 row-size=13B cardinality=unavailable'
'|'
'03:HASH JOIN [INNER JOIN, BROADCAST]'
'| hash predicates: t1.id = t2.id'
'| hosts=3 per-host-mem=2.00GB'
'| tuple-ids=0,1 row-size=24B cardinality=unavailable'
'|'
'|--06:EXCHANGE [BROADCAST]'
'| | hosts=3 per-host-mem=0B'
'| | tuple-ids=1 row-size=12B cardinality=unavailable'
'| |'
'| 01:SCAN HDFS [functional_parquet.alltypessmall t2, PARTITION=RANDOM]'
'| partitions=4/4 size=9.63KB'
'| table stats: unavailable'
'| columns missing stats: id, float_col'
'| hosts=3 per-host-mem=16.00MB'
'| tuple-ids=1 row-size=12B cardinality=unavailable'
'|'
'00:SCAN HDFS [functional_avro.alltypes t1, PARTITION=RANDOM]'
' partitions=2/24 size=39.87KB'
' table stats: unavailable'
' columns missing stats: id, int_col'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=0 row-size=12B cardinality=unavailable'
====

View File

@@ -312,3 +312,77 @@ where month = 2
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=1 row-size=97B cardinality=560'
====
---- QUERY
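# Tests that the explain header warns about tables missing table and/or column stats.
# functional_avro.alltypes is scanned twice (t1 and t3) but must be listed only once.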
explain select count(t1.int_col), avg(t2.float_col), sum(t3.bigint_col)
from functional_avro.alltypes t1
inner join functional_parquet.alltypessmall t2 on (t1.id = t2.id)
left outer join functional_avro.alltypes t3 on (t2.id = t3.id)
where t1.month = 1 and t2.year = 2009 and t3.bool_col = false
---- RESULTS
'Estimated Per-Host Requirements: Memory=4.03GB VCores=3'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'functional_avro.alltypes, functional_parquet.alltypessmall'
''
'F03:PLAN FRAGMENT [PARTITION=UNPARTITIONED]'
' 09:AGGREGATE [MERGE FINALIZE]'
' | output: sum(count(t1.int_col)), sum(sum(t2.float_col)), sum(count(t2.float_col)), sum(sum(t3.bigint_col))'
' | hosts=3 per-host-mem=unavailable'
' | tuple-ids=3 row-size=32B cardinality=1'
' |'
' 08:EXCHANGE [PARTITION=UNPARTITIONED]'
' hosts=3 per-host-mem=unavailable'
' tuple-ids=3 row-size=32B cardinality=1'
''
'F00:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F03, EXCHANGE=08, PARTITION=UNPARTITIONED]'
' 05:AGGREGATE'
' | output: count(t1.int_col), sum(t2.float_col), count(t2.float_col), sum(t3.bigint_col)'
' | hosts=3 per-host-mem=10.00MB'
' | tuple-ids=3 row-size=32B cardinality=1'
' |'
' 04:HASH JOIN [LEFT OUTER JOIN, BROADCAST]'
' | hash predicates: t2.id = t3.id'
' | other predicates: t3.bool_col = FALSE'
' | hosts=3 per-host-mem=2.00GB'
' | tuple-ids=0,1,2N row-size=37B cardinality=unavailable'
' |'
' |--07:EXCHANGE [BROADCAST]'
' | hosts=3 per-host-mem=0B'
' | tuple-ids=2 row-size=13B cardinality=unavailable'
' |'
' 03:HASH JOIN [INNER JOIN, BROADCAST]'
' | hash predicates: t1.id = t2.id'
' | hosts=3 per-host-mem=2.00GB'
' | tuple-ids=0,1 row-size=24B cardinality=unavailable'
' |'
' |--06:EXCHANGE [BROADCAST]'
' | hosts=3 per-host-mem=0B'
' | tuple-ids=1 row-size=12B cardinality=unavailable'
' |'
' 00:SCAN HDFS [functional_avro.alltypes t1, PARTITION=RANDOM]'
' partitions=2/24 size=39.87KB'
' table stats: unavailable'
' columns missing stats: id, int_col'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=0 row-size=12B cardinality=unavailable'
''
'F02:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F00, EXCHANGE=07, BROADCAST]'
' 02:SCAN HDFS [functional_avro.alltypes t3, PARTITION=RANDOM]'
' partitions=24/24 size=470.35KB'
' predicates: t3.bool_col = FALSE'
' table stats: unavailable'
' column stats: unavailable'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=2 row-size=13B cardinality=unavailable'
''
'F01:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F00, EXCHANGE=06, BROADCAST]'
' 01:SCAN HDFS [functional_parquet.alltypessmall t2, PARTITION=RANDOM]'
' partitions=4/4 size=9.63KB'
' table stats: unavailable'
' columns missing stats: id, float_col'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=1 row-size=12B cardinality=unavailable'
====

View File

@@ -82,6 +82,8 @@ WHERE tinyint_col < 7 AND smallint_col < 6 AND int_col < 5 AND bigint_col < 40 A
string_col in ('1', '2', '3')
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -94,6 +96,8 @@ SELECT * from all_insert_partition_col_types
WHERE tinyint_col < 7
---- RESULTS
'Estimated Per-Host Requirements: Memory=48.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -106,6 +110,8 @@ SELECT * from all_insert_partition_col_types
WHERE smallint_col < 6
---- RESULTS
'Estimated Per-Host Requirements: Memory=48.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -118,6 +124,8 @@ SELECT * from all_insert_partition_col_types
WHERE int_col < 5
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -130,6 +138,8 @@ SELECT * from all_insert_partition_col_types
WHERE bigint_col < 40
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -142,6 +152,8 @@ SELECT * from all_insert_partition_col_types
WHERE string_col in ('1', '2', '3')
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -154,6 +166,8 @@ SELECT * from all_insert_partition_col_types
WHERE double_col = 1.1
---- RESULTS
'Estimated Per-Host Requirements: Memory=64.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -166,6 +180,8 @@ SELECT * from all_insert_partition_col_types
WHERE float_col = 2
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_insert_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'
@@ -223,6 +239,8 @@ SELECT * FROM all_partition_col_types
WHERE bool_col=false
---- RESULTS
'Estimated Per-Host Requirements: Memory=32.00MB VCores=1'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'hdfs_partitioning.all_partition_col_types'
''
'01:EXCHANGE [PARTITION=UNPARTITIONED]'
'|'