mirror of
https://github.com/apache/impala.git
synced 2025-12-30 12:02:10 -05:00
This commit implements nested queries with [NOT] IN, [NOT] EXISTS and aggregate subquery predicates in Impala. The following cases are supported: 1. Correlated and uncorrelated [NOT] IN. 2. Correlated [NOT] EXISTS. 3. Correlated and uncorrelated aggregate subqueries. Change-Id: Ia3f4843c5f07d4e31ef3faedc58a15e623f91a5d Reviewed-on: http://gerrit.sjc.cloudera.com:8080/3754 Reviewed-by: Dimitris Tsirogiannis <dtsirogiannis@cloudera.com> Tested-by: jenkins Reviewed-on: http://gerrit.sjc.cloudera.com:8080/4109
81 lines
2.8 KiB
Plaintext
81 lines
2.8 KiB
Plaintext
---- QUERY
|
|
# limit in subquery: the outer count(*) is expected to see exactly the 10 rows that the inline view's limit lets through
|
|
select count(*) from (select * from alltypessmall limit 10) a
|
|
---- TYPES
|
|
BIGINT
|
|
---- RESULTS
|
|
10
|
|
====
|
|
---- QUERY
|
|
# order by/limit in subquery, followed by additional selection predicate;
|
|
# predicate is not applied in subquery: the inline view keeps ids 0-9 and the outer filter then keeps the rows with bool_col = true
# the outer select has no order by, so row order is not guaranteed; rows are compared with VERIFY_IS_EQUAL_SORTED
|
|
select id, bool_col, tinyint_col, smallint_col, int_col, bigint_col, float_col, double_col, date_string_col, string_col, timestamp_col, year, month
|
|
from (select id, bool_col, tinyint_col, smallint_col, int_col, bigint_col, float_col, double_col, date_string_col, string_col, timestamp_col, year, month from alltypessmall order by id limit 10) a
|
|
where bool_col = true
|
|
---- TYPES
|
|
INT, BOOLEAN, TINYINT, SMALLINT, INT, BIGINT, FLOAT, DOUBLE, STRING, STRING, TIMESTAMP, INT, INT
|
|
---- RESULTS: VERIFY_IS_EQUAL_SORTED
|
|
0,true,0,0,0,0,0,0,'01/01/09','0',2009-01-01 00:00:00,2009,1
|
|
2,true,2,2,2,20,2.200000047683716,20.2,'01/01/09','2',2009-01-01 00:02:00.100000000,2009,1
|
|
4,true,4,4,4,40,4.400000095367432,40.4,'01/01/09','4',2009-01-01 00:04:00.600000000,2009,1
|
|
6,true,6,6,6,60,6.599999904632568,60.6,'01/01/09','6',2009-01-01 00:06:00.150000000,2009,1
|
|
8,true,8,8,8,80,8.800000190734863,80.8,'01/01/09','8',2009-01-01 00:08:00.280000000,2009,1
|
|
====
|
|
---- QUERY
|
|
# order by/limit in subquery, followed by additional selection predicate;
|
|
# variant w/ join: the inline view self-joins alltypessmall on id before applying order by/limit
# the outer select has no order by, so row order is not guaranteed; rows are compared with VERIFY_IS_EQUAL_SORTED
|
|
select id, bool_col, tinyint_col, smallint_col, int_col, bigint_col, float_col, double_col, date_string_col, string_col, timestamp_col, year, month
|
|
from (
|
|
select a.* from alltypessmall a join alltypessmall using (id)
|
|
order by a.id limit 10
|
|
) a
|
|
where bool_col = true
|
|
---- TYPES
|
|
INT, BOOLEAN, TINYINT, SMALLINT, INT, BIGINT, FLOAT, DOUBLE, STRING, STRING, TIMESTAMP, INT, INT
|
|
---- RESULTS: VERIFY_IS_EQUAL_SORTED
|
|
0,true,0,0,0,0,0,0,'01/01/09','0',2009-01-01 00:00:00,2009,1
|
|
2,true,2,2,2,20,2.200000047683716,20.2,'01/01/09','2',2009-01-01 00:02:00.100000000,2009,1
|
|
4,true,4,4,4,40,4.400000095367432,40.4,'01/01/09','4',2009-01-01 00:04:00.600000000,2009,1
|
|
6,true,6,6,6,60,6.599999904632568,60.6,'01/01/09','6',2009-01-01 00:06:00.150000000,2009,1
|
|
8,true,8,8,8,80,8.800000190734863,80.8,'01/01/09','8',2009-01-01 00:08:00.280000000,2009,1
|
|
====
|
|
---- QUERY
|
|
# join against subquery with limit creates a merge fragment that applies the limit
# the outer query has no order by; the expected rows are compared via VERIFY_IS_EQUAL_SORTED
|
|
select alltypes.id, a.id
|
|
from alltypes
|
|
join (select id from alltypessmall order by id limit 10) a using (id)
|
|
---- TYPES
|
|
INT, INT
|
|
---- RESULTS: VERIFY_IS_EQUAL_SORTED
|
|
0,0
|
|
1,1
|
|
2,2
|
|
3,3
|
|
4,4
|
|
5,5
|
|
6,6
|
|
7,7
|
|
8,8
|
|
9,9
|
|
====
|
|
---- QUERY
|
|
# join against subquery with limit;
|
|
# predicate pushdown is prevented in presence of order by/limit clause; variant w/ join
# the outer order by a.id makes the expected row order significant here
# NOTE(review): the outer limit 5 equals the number of bool_col = true rows among ids 0-9, so these
# expected rows would presumably be identical even if the predicate were pushed below the inner
# limit 10 - consider a larger outer limit so the test can detect an unwanted pushdown; TODO confirm
|
|
select alltypes.id, a.id
|
|
from alltypes
|
|
join (
|
|
select a.id, a.bool_col
|
|
from alltypessmall a join alltypessmall using (id)
|
|
order by a.id limit 10
|
|
) a using (id)
|
|
where a.bool_col = true order by a.id limit 5
|
|
---- TYPES
|
|
INT, INT
|
|
---- RESULTS
|
|
0,0
|
|
2,2
|
|
4,4
|
|
6,6
|
|
8,8
|
|
====
|