====
---- QUERY
# Returns all results despite a discrepancy between the number of values
# scanned and the number of values stored in the file metadata.
# Set a single node and scanner thread to make this test deterministic.
set num_nodes=1;
set num_scanner_threads=1;
select id, cnt from bad_column_metadata t, (select count(*) cnt from t.int_array) v
---- TYPES
bigint,bigint
---- RESULTS
1,10
2,10
3,10
4,10
5,10
6,10
7,10
8,10
9,10
10,10
11,10
12,10
13,10
14,10
15,10
16,10
17,10
18,10
19,10
20,10
21,10
22,10
23,10
24,10
25,10
26,10
27,10
28,10
29,10
30,10
---- ERRORS
Column metadata states there are 50 values, but read 100 values from column element. file: hdfs://regex:.$
====
---- QUERY
# Same as above but only selecting a single scalar column.
set num_nodes=1;
set num_scanner_threads=1;
select id from bad_column_metadata
---- TYPES
bigint
---- RESULTS
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
---- ERRORS
Column metadata states there are 11 values, but read 10 values from column id. file: hdfs://regex:.$
====
---- QUERY
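# Scanning Parquet files that contain negative string lengths (one
# plain-encoded, one dict-encoded) should return no rows and report
# both files as corrupt.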
select * from bad_parquet_strings_negative_len
---- TYPES
STRING
---- RESULTS
---- ERRORS
row_regex: .*File '.*/plain-encoded-negative-len.parq' is corrupt: error decoding value of type STRING at offset 58.*
row_regex: .*File '.*/dict-encoded-negative-len.parq' is corrupt: error reading dictionary for data of type STRING: could not decode dictionary.*
====
---- QUERY
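# Scanning Parquet files whose string data overruns the data page buffer
# (one plain-encoded, one dict-encoded) should likewise return no rows
# and report both files as corrupt.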
select * from bad_parquet_strings_out_of_bounds
---- TYPES
STRING
---- RESULTS
---- ERRORS
row_regex: .*File '.*/plain-encoded-out-of-bounds.parq' is corrupt: error decoding value of type STRING at offset 58.*
row_regex: .*File '.*/dict-encoded-out-of-bounds.parq' is corrupt: error reading dictionary for data of type STRING: could not decode dictionary.*
====