mirror of
https://github.com/apache/impala.git
synced 2025-12-25 02:03:09 -05:00
Fix a bug in which Impala only reads the first stream of a multi-stream bz2/gzip file.
Change the bz2 decoder to read the file in a streaming fashion rather than reading the entire file into memory before it can be decompressed.
Change-Id: Icbe617d03a69953f0bf3aa0f7c30d34bc612f9f8
(cherry picked from commit b6d0b4e059329633dc50f1f73ebe35b7ac317a8e)
Reviewed-on: http://gerrit.cloudera.org:8080/2219
Reviewed-by: Juan Yu <jyu@cloudera.com>
Tested-by: Internal Jenkins
102 lines
1.6 KiB
Plaintext
102 lines
1.6 KiB
Plaintext
====
---- QUERY
# Total number of rows in bzip2_tbl; count(*) counts every row, NULL or not.
select count(*) from functional_text_bzip.bzip2_tbl
---- RESULTS
1000000
---- TYPES
BIGINT
====
---- QUERY
# count(col) only counts non-NULL values, so matching the count(*) result for
# this table (1000000) means every row decoded to a non-NULL col.
select count(col) from functional_text_bzip.bzip2_tbl
---- RESULTS
1000000
---- TYPES
BIGINT
====
---- QUERY
# col is a STRING, so "order by col" is lexicographic: '10', '100' and '1000'
# sort ahead of '2'. The limit keeps only the five smallest values.
select * from functional_text_bzip.bzip2_tbl order by col limit 5
---- RESULTS
'0'
'1'
'10'
'100'
'1000'
---- TYPES
STRING
====
---- QUERY
# Same lexicographic top-5 check as for bzip2_tbl, run against large_bzip2_tbl.
# col is a STRING, so '10', '100' and '1000' sort ahead of '2'.
select * from functional_text_bzip.large_bzip2_tbl order by col limit 5
---- RESULTS
'0'
'1'
'10'
'100'
'1000'
---- TYPES
STRING
====
---- QUERY
# Number of non-NULL col values in large_bzip2_tbl (ten times the 1000000
# expected for bzip2_tbl).
select count(col) from functional_text_bzip.large_bzip2_tbl
---- RESULTS
10000000
---- TYPES
BIGINT
====
---- QUERY
# Five lexicographically smallest col values (col is a STRING, so '10' sorts
# ahead of '2').
# NOTE(review): going by its name, this table is presumably backed by a large
# multi-stream bzip2 file - confirm against the table's data-load definition.
select * from functional_text_bzip.large_multistream_bzip2_tbl order by col limit 5
---- RESULTS
'0'
'1'
'10'
'100'
'1000'
---- TYPES
STRING
====
---- QUERY
# Number of non-NULL col values in multistream_bzip2_tbl.
# NOTE(review): presumably guards against reading only the first stream of a
# multi-stream file, which would yield a smaller count - confirm how the
# table's data file is generated.
select count(col) from functional_text_bzip.multistream_bzip2_tbl
---- RESULTS
1000000
---- TYPES
BIGINT
====
---- QUERY
# Five lexicographically smallest col values of multistream_bzip2_tbl; col is
# a STRING, so '10', '100' and '1000' sort ahead of '2'.
select * from functional_text_bzip.multistream_bzip2_tbl order by col limit 5
---- RESULTS
'0'
'1'
'10'
'100'
'1000'
---- TYPES
STRING
====
---- QUERY
# Total number of rows in large_multistream_bzip2_tbl; count(*) counts every
# row, NULL or not.
select count(*) from functional_text_bzip.large_multistream_bzip2_tbl
---- RESULTS
10000000
---- TYPES
BIGINT
====
---- QUERY
# count(col) only counts non-NULL values, so matching the count(*) result for
# this table (10000000) means every row decoded to a non-NULL col.
select count(col) from functional_text_bzip.large_multistream_bzip2_tbl
---- RESULTS
10000000
---- TYPES
BIGINT
====
---- QUERY
# The inline view keeps the five lexicographically smallest col values
# ('0', '1', '10', '100', '1000'); max() over those STRINGs is '1000'.
select max(col) from (select * from functional_text_bzip.bzip2_tbl order by col limit 5) t
---- RESULTS
'1000'
---- TYPES
STRING
====
---- QUERY
# The inline view keeps the five lexicographically smallest col values
# ('0', '1', '10', '100', '1000'); max() over those STRINGs is '1000'.
select max(col) from (select * from functional_text_bzip.multistream_bzip2_tbl order by col limit 5) t
---- RESULTS
'1000'
---- TYPES
STRING
====