Add list of tables missing stats to explain header and mem-limit exceeded error.

Change-Id: Ibe8f329d5513ae84a8134b9ddb3645fa174d8a66
Reviewed-on: http://gerrit.ent.cloudera.com:8080/1501
Reviewed-by: Alex Behm <alex.behm@cloudera.com>
Tested-by: jenkins
Reviewed-on: http://gerrit.ent.cloudera.com:8080/1880
This commit is contained in:
Alex Behm
2014-02-07 19:55:08 -08:00
committed by jenkins
parent b1aeea3f0b
commit 7fcd7cd64e
15 changed files with 323 additions and 29 deletions

View File

@@ -312,3 +312,77 @@ where month = 2
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=1 row-size=97B cardinality=560'
====
---- QUERY
# Checks that the explain header carries the warning that lists tables missing
# table and/or column statistics (three-way join over avro and parquet tables).
explain select
  count(t1.int_col),
  avg(t2.float_col),
  sum(t3.bigint_col)
from functional_avro.alltypes t1
  inner join functional_parquet.alltypessmall t2
    on (t1.id = t2.id)
  left outer join functional_avro.alltypes t3
    on (t2.id = t3.id)
where t1.month = 1
  and t2.year = 2009
  and t3.bool_col = false
---- RESULTS
'Estimated Per-Host Requirements: Memory=4.03GB VCores=3'
'WARNING: The following tables are missing relevant table and/or column statistics.'
'functional_avro.alltypes, functional_parquet.alltypessmall'
''
'F03:PLAN FRAGMENT [PARTITION=UNPARTITIONED]'
' 09:AGGREGATE [MERGE FINALIZE]'
' | output: sum(count(t1.int_col)), sum(sum(t2.float_col)), sum(count(t2.float_col)), sum(sum(t3.bigint_col))'
' | hosts=3 per-host-mem=unavailable'
' | tuple-ids=3 row-size=32B cardinality=1'
' |'
' 08:EXCHANGE [PARTITION=UNPARTITIONED]'
' hosts=3 per-host-mem=unavailable'
' tuple-ids=3 row-size=32B cardinality=1'
''
'F00:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F03, EXCHANGE=08, PARTITION=UNPARTITIONED]'
' 05:AGGREGATE'
' | output: count(t1.int_col), sum(t2.float_col), count(t2.float_col), sum(t3.bigint_col)'
' | hosts=3 per-host-mem=10.00MB'
' | tuple-ids=3 row-size=32B cardinality=1'
' |'
' 04:HASH JOIN [LEFT OUTER JOIN, BROADCAST]'
' | hash predicates: t2.id = t3.id'
' | other predicates: t3.bool_col = FALSE'
' | hosts=3 per-host-mem=2.00GB'
' | tuple-ids=0,1,2N row-size=37B cardinality=unavailable'
' |'
' |--07:EXCHANGE [BROADCAST]'
' | hosts=3 per-host-mem=0B'
' | tuple-ids=2 row-size=13B cardinality=unavailable'
' |'
' 03:HASH JOIN [INNER JOIN, BROADCAST]'
' | hash predicates: t1.id = t2.id'
' | hosts=3 per-host-mem=2.00GB'
' | tuple-ids=0,1 row-size=24B cardinality=unavailable'
' |'
' |--06:EXCHANGE [BROADCAST]'
' | hosts=3 per-host-mem=0B'
' | tuple-ids=1 row-size=12B cardinality=unavailable'
' |'
' 00:SCAN HDFS [functional_avro.alltypes t1, PARTITION=RANDOM]'
' partitions=2/24 size=39.87KB'
' table stats: unavailable'
' columns missing stats: id, int_col'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=0 row-size=12B cardinality=unavailable'
''
'F02:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F00, EXCHANGE=07, BROADCAST]'
' 02:SCAN HDFS [functional_avro.alltypes t3, PARTITION=RANDOM]'
' partitions=24/24 size=470.35KB'
' predicates: t3.bool_col = FALSE'
' table stats: unavailable'
' column stats: unavailable'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=2 row-size=13B cardinality=unavailable'
''
'F01:PLAN FRAGMENT [PARTITION=RANDOM]'
' DATASTREAM SINK [FRAGMENT=F00, EXCHANGE=06, BROADCAST]'
' 01:SCAN HDFS [functional_parquet.alltypessmall t2, PARTITION=RANDOM]'
' partitions=4/4 size=9.63KB'
' table stats: unavailable'
' columns missing stats: id, float_col'
' hosts=3 per-host-mem=16.00MB'
' tuple-ids=1 row-size=12B cardinality=unavailable'
====