testdata/workloads/functional-planner/queries/PlannerTest/inline-view.test - impala - Git at Google

 # subquery with aggregation and order by/limit, as left-hand side of join;
 # having clause in subquery is transfered to merge agg step in distrib plan
 select *
 from (
   select int_col, count(*)
   from functional.alltypessmall
   where month = 1
   group by int_col
   having count(*) > 1
   order by count(*) desc limit 5
   ) t1
 join functional.alltypes t2 on (t1.int_col = t2.int_col)
 where month = 1
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: t2.int_col = int_col
 |  runtime filters: RF000 <- int_col
 |  row-size=101B cardinality=620
 |
 |--02:TOP-N [LIMIT=5]
 |  |  order by: count(*) DESC
 |  |  row-size=12B cardinality=1
 |  |
 |  01:AGGREGATE [FINALIZE]
 |  |  output: count(*)
 |  |  group by: int_col
 |  |  having: count(*) > 1
 |  |  row-size=12B cardinality=1
 |  |
 |  00:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: `month` = 1
 |     partitions=1/4 files=1 size=1.57KB
 |     row-size=4B cardinality=25
 |
 03:SCAN HDFS [functional.alltypes t2]
    partition predicates: `month` = 1
    partitions=2/24 files=2 size=40.32KB
    runtime filters: RF000 -> t2.int_col
    row-size=89B cardinality=620
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 09:EXCHANGE [UNPARTITIONED]
 |
 04:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: t2.int_col = int_col
 |  runtime filters: RF000 <- int_col
 |  row-size=101B cardinality=620
 |
 |--08:EXCHANGE [BROADCAST]
 |  |
 |  07:MERGING-EXCHANGE [UNPARTITIONED]
 |  |  order by: count(*) DESC
 |  |  limit: 5
 |  |
 |  02:TOP-N [LIMIT=5]
 |  |  order by: count(*) DESC
 |  |  row-size=12B cardinality=1
 |  |
 |  06:AGGREGATE [FINALIZE]
 |  |  output: count:merge(*)
 |  |  group by: int_col
 |  |  having: count(*) > 1
 |  |  row-size=12B cardinality=1
 |  |
 |  05:EXCHANGE [HASH(int_col)]
 |  |
 |  01:AGGREGATE [STREAMING]
 |  |  output: count(*)
 |  |  group by: int_col
 |  |  row-size=12B cardinality=10
 |  |
 |  00:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: `month` = 1
 |     partitions=1/4 files=1 size=1.57KB
 |     row-size=4B cardinality=25
 |
 03:SCAN HDFS [functional.alltypes t2]
    partition predicates: `month` = 1
    partitions=2/24 files=2 size=40.32KB
    runtime filters: RF000 -> t2.int_col
    row-size=89B cardinality=620
 ====
 # simple full scan subquery
 select * from (select y x from (select id y from functional_hbase.alltypessmall) a) b
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:SCAN HBASE [functional_hbase.alltypessmall]
    row-size=4B cardinality=50
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 01:EXCHANGE [UNPARTITIONED]
 |
 00:SCAN HBASE [functional_hbase.alltypessmall]
    row-size=4B cardinality=50
 ====
 # subquery doing join
 select * from (select t2.*
 from functional.testtbl t1 join functional.testtbl t2 using(id)
 where t1.zip = 94611) x
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [INNER JOIN]
 |  hash predicates: t1.id = t2.id
 |  runtime filters: RF000 <- t2.id
 |  row-size=36B cardinality=0
 |
 |--01:SCAN HDFS [functional.testtbl t2]
 |     partitions=1/1 files=0 size=0B
 |     row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl t1]
    partitions=1/1 files=0 size=0B
    predicates: t1.zip = 94611
    runtime filters: RF000 -> t1.id
    row-size=12B cardinality=0
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 04:EXCHANGE [UNPARTITIONED]
 |
 02:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: t1.id = t2.id
 |  runtime filters: RF000 <- t2.id
 |  row-size=36B cardinality=0
 |
 |--03:EXCHANGE [BROADCAST]
 |  |
 |  01:SCAN HDFS [functional.testtbl t2]
 |     partitions=1/1 files=0 size=0B
 |     row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl t1]
    partitions=1/1 files=0 size=0B
    predicates: t1.zip = 94611
    runtime filters: RF000 -> t1.id
    row-size=12B cardinality=0
 ====
 # subquery doing join
 # multiple join predicates;
 # scan predicates get propagated correctly;
 # non-eq join predicates are evaluated as extra conjuncts by the join node
 select *
 from
   (select a.*
    from functional.alltypesagg a
      right outer join functional.alltypessmall b using (id, int_col)
    where a.day >= 6
      and b.month > 2
      and a.tinyint_col = 15
      and b.string_col = '15'
      and a.tinyint_col + b.tinyint_col < 15) x
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: a.id = b.id, a.int_col = b.int_col
 |  other predicates: a.tinyint_col = 15, a.`day` >= 6, a.tinyint_col + b.tinyint_col < 15
 |  runtime filters: RF000 <- b.id, RF001 <- b.int_col
 |  row-size=117B cardinality=5
 |
 |--01:SCAN HDFS [functional.alltypessmall b]
 |     partition predicates: b.`month` > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: b.string_col = '15'
 |     row-size=22B cardinality=5
 |
 00:SCAN HDFS [functional.alltypesagg a]
    partition predicates: a.`day` >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: a.tinyint_col = 15
    runtime filters: RF000 -> a.id, RF001 -> a.int_col
    row-size=95B cardinality=556
 ---- SCANRANGELOCATIONS
 NODE 0:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=10/100110.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=6/100106.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=7/100107.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=8/100108.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=9/100109.txt 0:76263
 NODE 1:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=3/090301.txt 0:1620
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=4/090401.txt 0:1621
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:EXCHANGE [UNPARTITIONED]
 |
 02:HASH JOIN [RIGHT OUTER JOIN, PARTITIONED]
 |  hash predicates: a.id = b.id, a.int_col = b.int_col
 |  other predicates: a.tinyint_col = 15, a.`day` >= 6, a.tinyint_col + b.tinyint_col < 15
 |  runtime filters: RF000 <- b.id, RF001 <- b.int_col
 |  row-size=117B cardinality=5
 |
 |--04:EXCHANGE [HASH(b.id,b.int_col)]
 |  |
 |  01:SCAN HDFS [functional.alltypessmall b]
 |     partition predicates: b.`month` > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: b.string_col = '15'
 |     row-size=22B cardinality=5
 |
 03:EXCHANGE [HASH(a.id,a.int_col)]
 |
 00:SCAN HDFS [functional.alltypesagg a]
    partition predicates: a.`day` >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: a.tinyint_col = 15
    runtime filters: RF000 -> a.id, RF001 -> a.int_col
    row-size=95B cardinality=556
 ====
 # predicate pushdown
 select * from (select * from functional_hbase.alltypessmall) a where id < 5
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:SCAN HBASE [functional_hbase.alltypessmall]
    predicates: functional_hbase.alltypessmall.id < 5
    row-size=89B cardinality=5
 ====
 # subquery join
 # multiple join predicates;
 # scan predicates get propagated correctly;
 # non-eq join predicates are evaluated as extra conjuncts by the join node
 select *
 from
   (select id, int_col, day, tinyint_col from functional.alltypesagg) a
   right outer join
   (select id, int_col, month, string_col, tinyint_col
    from functional.alltypessmall) b using (id, int_col)
 where a.day >= 6
 and b.month > 2
 and a.tinyint_col = 15
 and b.string_col = '15'
 and a.tinyint_col + b.tinyint_col < 15
 and b.id + 15 = 27
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: id = id, int_col = int_col
 |  other predicates: tinyint_col = 15, `day` >= 6, tinyint_col + tinyint_col < 15
 |  runtime filters: RF000 <- id, RF001 <- int_col
 |  row-size=39B cardinality=2
 |
 |--01:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: functional.alltypessmall.month > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: functional.alltypessmall.string_col = '15', functional.alltypessmall.id + 15 = 27
 |     row-size=26B cardinality=2
 |
 00:SCAN HDFS [functional.alltypesagg]
    partition predicates: functional.alltypesagg.day >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: functional.alltypesagg.tinyint_col = 15, functional.alltypesagg.id + 15 = 27
    runtime filters: RF000 -> id, RF001 -> int_col
    row-size=13B cardinality=167
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:EXCHANGE [UNPARTITIONED]
 |
 02:HASH JOIN [RIGHT OUTER JOIN, PARTITIONED]
 |  hash predicates: id = id, int_col = int_col
 |  other predicates: tinyint_col = 15, `day` >= 6, tinyint_col + tinyint_col < 15
 |  runtime filters: RF000 <- id, RF001 <- int_col
 |  row-size=39B cardinality=2
 |
 |--04:EXCHANGE [HASH(id,int_col)]
 |  |
 |  01:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: functional.alltypessmall.month > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: functional.alltypessmall.string_col = '15', functional.alltypessmall.id + 15 = 27
 |     row-size=26B cardinality=2
 |
 03:EXCHANGE [HASH(id,int_col)]
 |
 00:SCAN HDFS [functional.alltypesagg]
    partition predicates: functional.alltypesagg.day >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: functional.alltypesagg.tinyint_col = 15, functional.alltypesagg.id + 15 = 27
    runtime filters: RF000 -> id, RF001 -> int_col
    row-size=13B cardinality=167
 ====
 # subquery join
 # multiple join predicates;
 # scan predicates get propagated correctly;
 # non-eq join predicates are evaluated as extra conjuncts by the join node
 select *
 from
   (select id, int_col, day, tinyint_col
    from
      (select id, int_col, day, tinyint_col from functional.alltypesagg) a0
    where a0.day >= 6) a
   right outer join
   (select id, int_col, month, string_col, tinyint_col from functional.alltypessmall) b
   using (id, int_col)
 where b.month > 2
 and a.tinyint_col = 15
 and b.string_col = '15'
 and a.tinyint_col + b.tinyint_col < 15
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: id = id, int_col = int_col
 |  other predicates: tinyint_col = 15, tinyint_col + tinyint_col < 15
 |  runtime filters: RF000 <- id, RF001 <- int_col
 |  row-size=39B cardinality=5
 |
 |--01:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: functional.alltypessmall.month > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: functional.alltypessmall.string_col = '15'
 |     row-size=26B cardinality=5
 |
 00:SCAN HDFS [functional.alltypesagg]
    partition predicates: functional.alltypesagg.day >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: functional.alltypesagg.tinyint_col = 15
    runtime filters: RF000 -> id, RF001 -> int_col
    row-size=13B cardinality=556
 ---- SCANRANGELOCATIONS
 NODE 0:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=10/100110.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=6/100106.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=7/100107.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=8/100108.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=9/100109.txt 0:76263
 NODE 1:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=3/090301.txt 0:1620
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=4/090401.txt 0:1621
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:EXCHANGE [UNPARTITIONED]
 |
 02:HASH JOIN [RIGHT OUTER JOIN, PARTITIONED]
 |  hash predicates: id = id, int_col = int_col
 |  other predicates: tinyint_col = 15, tinyint_col + tinyint_col < 15
 |  runtime filters: RF000 <- id, RF001 <- int_col
 |  row-size=39B cardinality=5
 |
 |--04:EXCHANGE [HASH(id,int_col)]
 |  |
 |  01:SCAN HDFS [functional.alltypessmall]
 |     partition predicates: functional.alltypessmall.month > 2
 |     partitions=2/4 files=2 size=3.17KB
 |     predicates: functional.alltypessmall.string_col = '15'
 |     row-size=26B cardinality=5
 |
 03:EXCHANGE [HASH(id,int_col)]
 |
 00:SCAN HDFS [functional.alltypesagg]
    partition predicates: functional.alltypesagg.day >= 6
    partitions=5/11 files=5 size=372.38KB
    predicates: functional.alltypesagg.tinyint_col = 15
    runtime filters: RF000 -> id, RF001 -> int_col
    row-size=13B cardinality=556
 ====
 # complex join, having joined subquery on the rhs, and predicate
 # at multiple subquery level. This tests that both sides of a join
 # that is itself on the build side of another join get compacted.
 select x.smallint_col, x.id, x.tinyint_col, c.id, x.int_col, x.float_col, c.string_col
 from functional.alltypessmall c
 join (
    select a.smallint_col smallint_col, a.tinyint_col tinyint_col, a.day day,
            a.int_col int_col, a.month month, b.float_col float_col, b.id id
    from ( select * from functional.alltypesagg a where month=1 ) a
    join functional.alltypessmall b on (a.smallint_col = b.id)
  ) x on (x.tinyint_col = c.id)
 where x.day=1
 and x.int_col > 899
 and x.float_col > 4.5
 and c.string_col < '7'
 and x.int_col + x.float_col + cast(c.string_col as float) < 1000
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: c.id = a.tinyint_col
 |  other predicates: a.int_col + b.float_col + CAST(c.string_col AS FLOAT) < 1000
 |  runtime filters: RF000 <- a.tinyint_col
 |  row-size=32B cardinality=11
 |
 |--03:HASH JOIN [INNER JOIN]
 |  |  hash predicates: a.smallint_col = b.id
 |  |  runtime filters: RF002 <- b.id
 |  |  row-size=15B cardinality=11
 |  |
 |  |--02:SCAN HDFS [functional.alltypessmall b]
 |  |     partitions=4/4 files=4 size=6.32KB
 |  |     predicates: b.float_col > 4.5
 |  |     row-size=8B cardinality=10
 |  |
 |  01:SCAN HDFS [functional.alltypesagg a]
 |     partition predicates: `month` = 1, a.day = 1
 |     partitions=1/11 files=1 size=73.39KB
 |     predicates: a.int_col > 899
 |     runtime filters: RF002 -> a.smallint_col
 |     row-size=7B cardinality=100
 |
 00:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    predicates: c.string_col < '7'
    runtime filters: RF000 -> c.id
    row-size=17B cardinality=10
 ---- SCANRANGELOCATIONS
 NODE 0:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=1/090101.txt 0:1610
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=2/090201.txt 0:1621
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=3/090301.txt 0:1620
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=4/090401.txt 0:1621
 NODE 1:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=1/100101.txt 0:75153
 NODE 2:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=1/090101.txt 0:1610
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=2/090201.txt 0:1621
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=3/090301.txt 0:1620
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypessmall/year=2009/month=4/090401.txt 0:1621
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 09:EXCHANGE [UNPARTITIONED]
 |
 04:HASH JOIN [INNER JOIN, PARTITIONED]
 |  hash predicates: c.id = a.tinyint_col
 |  other predicates: a.int_col + b.float_col + CAST(c.string_col AS FLOAT) < 1000
 |  runtime filters: RF000 <- a.tinyint_col
 |  row-size=32B cardinality=11
 |
 |--08:EXCHANGE [HASH(a.tinyint_col)]
 |  |
 |  03:HASH JOIN [INNER JOIN, PARTITIONED]
 |  |  hash predicates: b.id = a.smallint_col
 |  |  runtime filters: RF002 <- a.smallint_col
 |  |  row-size=15B cardinality=11
 |  |
 |  |--06:EXCHANGE [HASH(a.smallint_col)]
 |  |  |
 |  |  01:SCAN HDFS [functional.alltypesagg a]
 |  |     partition predicates: `month` = 1, a.day = 1
 |  |     partitions=1/11 files=1 size=73.39KB
 |  |     predicates: a.int_col > 899
 |  |     row-size=7B cardinality=100
 |  |
 |  05:EXCHANGE [HASH(b.id)]
 |  |
 |  02:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     predicates: b.float_col > 4.5
 |     runtime filters: RF002 -> b.id
 |     row-size=8B cardinality=10
 |
 07:EXCHANGE [HASH(c.id)]
 |
 00:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    predicates: c.string_col < '7'
    runtime filters: RF000 -> c.id
    row-size=17B cardinality=10
 ====
 # with grouping
 select tinyint_col, count(*), min(tinyint_col), max(tinyint_col), sum(tinyint_col),
 avg(tinyint_col)
 from (select * from functional.alltypesagg) a
 group by 1
 ---- PLAN
 PLAN-ROOT SINK
 |
 01:AGGREGATE [FINALIZE]
 |  output: count(*), min(functional.alltypesagg.tinyint_col), max(functional.alltypesagg.tinyint_col), sum(functional.alltypesagg.tinyint_col), avg(functional.alltypesagg.tinyint_col)
 |  group by: functional.alltypesagg.tinyint_col
 |  row-size=27B cardinality=9
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=1B cardinality=11.00K
 ---- SCANRANGELOCATIONS
 NODE 0:
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=1/100101.txt 0:75153
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=10/100110.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=2/100102.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=3/100103.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=4/100104.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=5/100105.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=6/100106.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=7/100107.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=8/100108.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=9/100109.txt 0:76263
   HDFS SPLIT hdfs://localhost:20500/test-warehouse/alltypesagg/year=2010/month=1/day=__HIVE_DEFAULT_PARTITION__/000000_0 0:72759
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 04:EXCHANGE [UNPARTITIONED]
 |
 03:AGGREGATE [FINALIZE]
 |  output: count:merge(*), min:merge(tinyint_col), max:merge(tinyint_col), sum:merge(tinyint_col), avg:merge(tinyint_col)
 |  group by: tinyint_col
 |  row-size=27B cardinality=9
 |
 02:EXCHANGE [HASH(tinyint_col)]
 |
 01:AGGREGATE [STREAMING]
 |  output: count(*), min(functional.alltypesagg.tinyint_col), max(functional.alltypesagg.tinyint_col), sum(functional.alltypesagg.tinyint_col), avg(functional.alltypesagg.tinyint_col)
 |  group by: functional.alltypesagg.tinyint_col
 |  row-size=27B cardinality=9
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=1B cardinality=11.00K
 ====
 # with grouping
 select * from (
 select tinyint_col, count(*), min(tinyint_col), max(tinyint_col), sum(tinyint_col),
 avg(tinyint_col)
 from functional.alltypesagg
 group by 1
 ) a
 ---- PLAN
 PLAN-ROOT SINK
 |
 01:AGGREGATE [FINALIZE]
 |  output: count(*), min(tinyint_col), max(tinyint_col), sum(tinyint_col), avg(tinyint_col)
 |  group by: tinyint_col
 |  row-size=27B cardinality=9
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=1B cardinality=11.00K
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 04:EXCHANGE [UNPARTITIONED]
 |
 03:AGGREGATE [FINALIZE]
 |  output: count:merge(*), min:merge(tinyint_col), max:merge(tinyint_col), sum:merge(tinyint_col), avg:merge(tinyint_col)
 |  group by: tinyint_col
 |  row-size=27B cardinality=9
 |
 02:EXCHANGE [HASH(tinyint_col)]
 |
 01:AGGREGATE [STREAMING]
 |  output: count(*), min(tinyint_col), max(tinyint_col), sum(tinyint_col), avg(tinyint_col)
 |  group by: tinyint_col
 |  row-size=27B cardinality=9
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=1B cardinality=11.00K
 ====
 select c1, c2, c3
 from
   (select c1, c2, c3
    from
      (select int_col c1, sum(float_col) c2, min(float_col) c3
       from functional_hbase.alltypessmall
       group by 1) x
     order by 2,3 desc
     limit 5
 ) y
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:TOP-N [LIMIT=5]
 |  order by: c2 ASC, c3 DESC
 |  row-size=16B cardinality=5
 |
 01:AGGREGATE [FINALIZE]
 |  output: sum(float_col), min(float_col)
 |  group by: int_col
 |  row-size=16B cardinality=10
 |
 00:SCAN HBASE [functional_hbase.alltypessmall]
    row-size=8B cardinality=50
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:MERGING-EXCHANGE [UNPARTITIONED]
 |  order by: c2 ASC, c3 DESC
 |  limit: 5
 |
 02:TOP-N [LIMIT=5]
 |  order by: c2 ASC, c3 DESC
 |  row-size=16B cardinality=5
 |
 04:AGGREGATE [FINALIZE]
 |  output: sum:merge(float_col), min:merge(float_col)
 |  group by: int_col
 |  row-size=16B cardinality=10
 |
 03:EXCHANGE [HASH(int_col)]
 |
 01:AGGREGATE [STREAMING]
 |  output: sum(float_col), min(float_col)
 |  group by: int_col
 |  row-size=16B cardinality=10
 |
 00:SCAN HBASE [functional_hbase.alltypessmall]
    row-size=8B cardinality=50
 ====
 select c1, x2
 from (
   select c1, min(c2) x2
   from (
     select c1, c2, c3
     from (
       select int_col c1, tinyint_col c2, min(float_col) c3
       from functional_hbase.alltypessmall
       group by 1, 2
       order by 1,2
       limit 1
     ) x
   ) x2
   group by c1
 ) y
 order by 2,1 desc
 limit 0
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:EMPTYSET
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 00:EMPTYSET
 ====
 # distinct *
 select distinct *
 from (select distinct * from functional.testtbl) x
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 01:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl]
    partitions=1/1 files=0 size=0B
    row-size=24B cardinality=0
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:EXCHANGE [UNPARTITIONED]
 |
 02:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 04:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 03:EXCHANGE [HASH(functional.testtbl.id,functional.testtbl.name,functional.testtbl.zip)]
 |
 01:AGGREGATE [STREAMING]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl]
    partitions=1/1 files=0 size=0B
    row-size=24B cardinality=0
 ====
 # distinct w/ explicit select list
 select distinct id, zip
 from (select distinct * from functional.testtbl) x
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.zip
 |  row-size=12B cardinality=0
 |
 01:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl]
    partitions=1/1 files=0 size=0B
    row-size=24B cardinality=0
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 07:EXCHANGE [UNPARTITIONED]
 |
 06:AGGREGATE [FINALIZE]
 |  group by: id, zip
 |  row-size=12B cardinality=0
 |
 05:EXCHANGE [HASH(id,zip)]
 |
 02:AGGREGATE [STREAMING]
 |  group by: functional.testtbl.id, functional.testtbl.zip
 |  row-size=12B cardinality=0
 |
 04:AGGREGATE [FINALIZE]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 03:EXCHANGE [HASH(functional.testtbl.id,functional.testtbl.name,functional.testtbl.zip)]
 |
 01:AGGREGATE [STREAMING]
 |  group by: functional.testtbl.id, functional.testtbl.name, functional.testtbl.zip
 |  row-size=24B cardinality=0
 |
 00:SCAN HDFS [functional.testtbl]
    partitions=1/1 files=0 size=0B
    row-size=24B cardinality=0
 ====
 # aggregate with group-by, having
 select *
 from (
        select int_col % 7 c1, count(*) c2, avg(int_col) c3
        from (
               select * from functional.alltypesagg
             ) a
        group by 1
        having avg(int_col) > 500 or count(*) = 10
      ) b
 where c1 is not null
 and   c2 > 10
 ---- PLAN
 PLAN-ROOT SINK
 |
 01:AGGREGATE [FINALIZE]
 |  output: count(*), avg(functional.alltypesagg.int_col)
 |  group by: functional.alltypesagg.int_col % 7
 |  having: int_col % 7 IS NOT NULL, count(*) > 10, avg(int_col) > 500 OR count(*) = 10
 |  row-size=20B cardinality=96
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=4B cardinality=11.00K
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 04:EXCHANGE [UNPARTITIONED]
 |
 03:AGGREGATE [FINALIZE]
 |  output: count:merge(*), avg:merge(int_col)
 |  group by: int_col % 7
 |  having: int_col % 7 IS NOT NULL, count(*) > 10, avg(int_col) > 500 OR count(*) = 10
 |  row-size=20B cardinality=96
 |
 02:EXCHANGE [HASH(int_col % 7)]
 |
 01:AGGREGATE [STREAMING]
 |  output: count(*), avg(functional.alltypesagg.int_col)
 |  group by: functional.alltypesagg.int_col % 7
 |  row-size=20B cardinality=957
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    row-size=4B cardinality=11.00K
 ====
 # subquery with left outer join
 select j.*, d.*
 from (
        select *
        from functional.JoinTbl a
      ) j
      left outer join
      (
        select *
        from functional.DimTbl b
      ) d
      on (j.test_name = d.name)
 where j.test_id <= 1006
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: b.name = a.test_name
 |  runtime filters: RF000 <- a.test_name
 |  row-size=63B cardinality=2
 |
 |--00:SCAN HDFS [functional.jointbl a]
 |     partitions=1/1 files=1 size=433B
 |     predicates: a.test_id <= 1006
 |     row-size=33B cardinality=2
 |
 01:SCAN HDFS [functional.dimtbl b]
    partitions=1/1 files=1 size=171B
    runtime filters: RF000 -> b.name
    row-size=29B cardinality=10
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 05:EXCHANGE [UNPARTITIONED]
 |
 02:HASH JOIN [RIGHT OUTER JOIN, PARTITIONED]
 |  hash predicates: b.name = a.test_name
 |  runtime filters: RF000 <- a.test_name
 |  row-size=63B cardinality=2
 |
 |--04:EXCHANGE [HASH(a.test_name)]
 |  |
 |  00:SCAN HDFS [functional.jointbl a]
 |     partitions=1/1 files=1 size=433B
 |     predicates: a.test_id <= 1006
 |     row-size=33B cardinality=2
 |
 03:EXCHANGE [HASH(b.name)]
 |
 01:SCAN HDFS [functional.dimtbl b]
    partitions=1/1 files=1 size=171B
    runtime filters: RF000 -> b.name
    row-size=29B cardinality=10
 ====
 # complex join, having joined subquery on the rhs, and predicate
 # at multiple subquery level
 select x.smallint_col, count(x.id)
 from functional.alltypessmall c
      left outer join
      (
        select a.smallint_col smallint_col, a.tinyint_col tinyint_col, a.day day,
                a.int_col int_col, a.month month, b.float_col float_col, b.id id
         from (
                 select *
                 from functional.alltypesagg a
              ) a
              join
              functional.alltypessmall b
              on (a.smallint_col = b.id)
      ) x
      on (x.tinyint_col = c.id)
 group by x.smallint_col
 ---- PLAN
 PLAN-ROOT SINK
 |
 05:AGGREGATE [FINALIZE]
 |  output: count(b.id)
 |  group by: a.smallint_col
 |  row-size=10B cardinality=97
 |
 04:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: a.tinyint_col = c.id
 |  runtime filters: RF000 <- c.id
 |  row-size=11B cardinality=11.11K
 |
 |--00:SCAN HDFS [functional.alltypessmall c]
 |     partitions=4/4 files=4 size=6.32KB
 |     row-size=4B cardinality=100
 |
 03:HASH JOIN [INNER JOIN]
 |  hash predicates: a.smallint_col = b.id
 |  runtime filters: RF002 <- b.id
 |  row-size=7B cardinality=11.00K
 |
 |--02:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     row-size=4B cardinality=100
 |
 01:SCAN HDFS [functional.alltypesagg a]
    partitions=11/11 files=11 size=814.73KB
    runtime filters: RF000 -> a.tinyint_col, RF002 -> a.smallint_col
    row-size=3B cardinality=11.00K
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 11:EXCHANGE [UNPARTITIONED]
 |
 10:AGGREGATE [FINALIZE]
 |  output: count:merge(x.id)
 |  group by: x.smallint_col
 |  row-size=10B cardinality=97
 |
 09:EXCHANGE [HASH(x.smallint_col)]
 |
 05:AGGREGATE [STREAMING]
 |  output: count(b.id)
 |  group by: a.smallint_col
 |  row-size=10B cardinality=97
 |
 04:HASH JOIN [RIGHT OUTER JOIN, PARTITIONED]
 |  hash predicates: a.tinyint_col = c.id
 |  runtime filters: RF000 <- c.id
 |  row-size=11B cardinality=11.11K
 |
 |--08:EXCHANGE [HASH(c.id)]
 |  |
 |  00:SCAN HDFS [functional.alltypessmall c]
 |     partitions=4/4 files=4 size=6.32KB
 |     row-size=4B cardinality=100
 |
 07:EXCHANGE [HASH(a.tinyint_col)]
 |
 03:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: a.smallint_col = b.id
 |  runtime filters: RF002 <- b.id
 |  row-size=7B cardinality=11.00K
 |
 |--06:EXCHANGE [BROADCAST]
 |  |
 |  02:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     row-size=4B cardinality=100
 |
 01:SCAN HDFS [functional.alltypesagg a]
    partitions=11/11 files=11 size=814.73KB
    runtime filters: RF000 -> a.tinyint_col, RF002 -> a.smallint_col
    row-size=3B cardinality=11.00K
 ====
 # complex join, having joined subquery on the lhs, and predicate
 # at multiple subquery level
 select x.smallint_col, x.id, x.tinyint_col, c.id, x.int_col, x.float_col, c.string_col
 from
      (
        select a.smallint_col smallint_col, a.tinyint_col tinyint_col, a.day day,
                a.int_col int_col, a.month month, b.float_col float_col, b.id id
         from (
                 select *
                 from functional.alltypesagg a
                 where month=1
              ) a
              join
              functional.alltypessmall b
              on (a.smallint_col = b.id)
      ) x
      join
       functional.alltypessmall c
      on (x.tinyint_col = c.id)
 where x.day=1
 and x.int_col > 899
 and x.float_col > 4.5
 and c.string_col < '7'
 and x.int_col + x.float_col + CAST(c.string_col AS FLOAT) < 1000
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: c.id = a.tinyint_col
 |  other predicates: a.int_col + b.float_col + CAST(c.string_col AS FLOAT) < 1000
 |  runtime filters: RF000 <- a.tinyint_col
 |  row-size=32B cardinality=11
 |
 |--02:HASH JOIN [INNER JOIN]
 |  |  hash predicates: a.smallint_col = b.id
 |  |  runtime filters: RF002 <- b.id
 |  |  row-size=15B cardinality=11
 |  |
 |  |--01:SCAN HDFS [functional.alltypessmall b]
 |  |     partitions=4/4 files=4 size=6.32KB
 |  |     predicates: b.float_col > 4.5
 |  |     row-size=8B cardinality=10
 |  |
 |  00:SCAN HDFS [functional.alltypesagg a]
 |     partition predicates: `month` = 1, a.day = 1
 |     partitions=1/11 files=1 size=73.39KB
 |     predicates: a.int_col > 899
 |     runtime filters: RF002 -> a.smallint_col
 |     row-size=7B cardinality=100
 |
 03:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    predicates: c.string_col < '7'
    runtime filters: RF000 -> c.id
    row-size=17B cardinality=10
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 09:EXCHANGE [UNPARTITIONED]
 |
 04:HASH JOIN [INNER JOIN, PARTITIONED]
 |  hash predicates: c.id = a.tinyint_col
 |  other predicates: a.int_col + b.float_col + CAST(c.string_col AS FLOAT) < 1000
 |  runtime filters: RF000 <- a.tinyint_col
 |  row-size=32B cardinality=11
 |
 |--08:EXCHANGE [HASH(a.tinyint_col)]
 |  |
 |  02:HASH JOIN [INNER JOIN, PARTITIONED]
 |  |  hash predicates: b.id = a.smallint_col
 |  |  runtime filters: RF002 <- a.smallint_col
 |  |  row-size=15B cardinality=11
 |  |
 |  |--06:EXCHANGE [HASH(a.smallint_col)]
 |  |  |
 |  |  00:SCAN HDFS [functional.alltypesagg a]
 |  |     partition predicates: `month` = 1, a.day = 1
 |  |     partitions=1/11 files=1 size=73.39KB
 |  |     predicates: a.int_col > 899
 |  |     row-size=7B cardinality=100
 |  |
 |  05:EXCHANGE [HASH(b.id)]
 |  |
 |  01:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     predicates: b.float_col > 4.5
 |     runtime filters: RF002 -> b.id
 |     row-size=8B cardinality=10
 |
 07:EXCHANGE [HASH(c.id)]
 |
 03:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    predicates: c.string_col < '7'
    runtime filters: RF000 -> c.id
    row-size=17B cardinality=10
 ====
 # complex join, having joined aggregate subquery on the rhs, and predicate
 # at multiple subquery level
 select x.smallint_col, sum(x.cnt)
 from functional.alltypessmall c
   join (
     select count(a.id) cnt, b.smallint_col smallint_col
     from ( select * from functional.alltypesagg a ) a
       join functional.alltypessmall b on (a.smallint_col = b.id)
     group by b.smallint_col
   ) x on (x.smallint_col = c.id)
 group by x.smallint_col
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:AGGREGATE [FINALIZE]
 |  output: sum(count(a.id))
 |  group by: b.smallint_col
 |  row-size=10B cardinality=10
 |
 05:HASH JOIN [INNER JOIN]
 |  hash predicates: c.id = b.smallint_col
 |  runtime filters: RF000 <- b.smallint_col
 |  row-size=14B cardinality=10
 |
 |--04:AGGREGATE [FINALIZE]
 |  |  output: count(a.id)
 |  |  group by: b.smallint_col
 |  |  row-size=10B cardinality=10
 |  |
 |  03:HASH JOIN [INNER JOIN]
 |  |  hash predicates: a.smallint_col = b.id
 |  |  runtime filters: RF002 <- b.id
 |  |  row-size=12B cardinality=11.00K
 |  |
 |  |--02:SCAN HDFS [functional.alltypessmall b]
 |  |     partitions=4/4 files=4 size=6.32KB
 |  |     row-size=6B cardinality=100
 |  |
 |  01:SCAN HDFS [functional.alltypesagg a]
 |     partitions=11/11 files=11 size=814.73KB
 |     runtime filters: RF002 -> a.smallint_col
 |     row-size=6B cardinality=11.00K
 |
 00:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> c.id
    row-size=4B cardinality=100
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 13:EXCHANGE [UNPARTITIONED]
 |
 12:AGGREGATE [FINALIZE]
 |  output: sum:merge(x.cnt)
 |  group by: x.smallint_col
 |  row-size=10B cardinality=10
 |
 11:EXCHANGE [HASH(x.smallint_col)]
 |
 06:AGGREGATE [STREAMING]
 |  output: sum(count(a.id))
 |  group by: b.smallint_col
 |  row-size=10B cardinality=10
 |
 05:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: c.id = b.smallint_col
 |  runtime filters: RF000 <- b.smallint_col
 |  row-size=14B cardinality=10
 |
 |--10:EXCHANGE [BROADCAST]
 |  |
 |  09:AGGREGATE [FINALIZE]
 |  |  output: count:merge(a.id)
 |  |  group by: b.smallint_col
 |  |  row-size=10B cardinality=10
 |  |
 |  08:EXCHANGE [HASH(b.smallint_col)]
 |  |
 |  04:AGGREGATE [STREAMING]
 |  |  output: count(a.id)
 |  |  group by: b.smallint_col
 |  |  row-size=10B cardinality=10
 |  |
 |  03:HASH JOIN [INNER JOIN, BROADCAST]
 |  |  hash predicates: a.smallint_col = b.id
 |  |  runtime filters: RF002 <- b.id
 |  |  row-size=12B cardinality=11.00K
 |  |
 |  |--07:EXCHANGE [BROADCAST]
 |  |  |
 |  |  02:SCAN HDFS [functional.alltypessmall b]
 |  |     partitions=4/4 files=4 size=6.32KB
 |  |     row-size=6B cardinality=100
 |  |
 |  01:SCAN HDFS [functional.alltypesagg a]
 |     partitions=11/11 files=11 size=814.73KB
 |     runtime filters: RF002 -> a.smallint_col
 |     row-size=6B cardinality=11.00K
 |
 00:SCAN HDFS [functional.alltypessmall c]
    partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> c.id
    row-size=4B cardinality=100
 ====
 # Values statement in subqueries with predicate
 select * from (select y from (values((1 as y),(11))) a where y < 10) b
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
    constant-operands=1
    row-size=1B cardinality=1
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 00:UNION
    constant-operands=1
    row-size=1B cardinality=1
 ====
 # Mixed constant and non-constant select; the predicate is evaluated directly
 # by the non-const select
 select * from
   (select y from
     ((select 1 as y)
      union all
      (select tinyint_col from functional.alltypes)) a
    where y < 10) b
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  pass-through-operands: all
 |  row-size=1B cardinality=731
 |
 01:SCAN HDFS [functional.alltypes]
    partitions=24/24 files=24 size=478.45KB
    predicates: functional.alltypes.tinyint_col < 10
    row-size=1B cardinality=730
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 02:EXCHANGE [UNPARTITIONED]
 |
 00:UNION
 |  constant-operands=1
 |  pass-through-operands: all
 |  row-size=1B cardinality=731
 |
 01:SCAN HDFS [functional.alltypes]
    partitions=24/24 files=24 size=478.45KB
    predicates: functional.alltypes.tinyint_col < 10
    row-size=1B cardinality=730
 ====
 # Union of constant selects in subquery
 select * from (select 1 as y union all select 2 union all select * from (select 11) a) b
 where y < 10
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
    constant-operands=2
    row-size=1B cardinality=2
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 00:UNION
    constant-operands=2
    row-size=1B cardinality=2
 ====
 # Union of values statements in subquery
 # TODO: We could combine the merge nodes below.
 select * from (values(1 as y) union all values(2) union all select * from (values(11)) a) b
 where y < 10
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=2
 |  row-size=1B cardinality=2
 |
 01:UNION
    row-size=1B cardinality=0
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=2
 |  row-size=1B cardinality=2
 |
 01:UNION
    row-size=1B cardinality=0
 ====
 # Inner join on inline views made up of unions of constant selects
 select * from
 (select 1 a, 2 b union all select 1 a, 2 b) x
 inner join
 (select 1 a, 3 b union all select 1 a, 2 b) y on x.a = y.a
 inner join
 (select 1 a, 3 b union all select 1 a, 3 b) z on z.b = y.b
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: b = b
 |  row-size=6B cardinality=2
 |
 |--02:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 03:HASH JOIN [INNER JOIN]
 |  hash predicates: a = a
 |  row-size=4B cardinality=2
 |
 |--01:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 00:UNION
    constant-operands=2
    row-size=2B cardinality=2
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: b = b
 |  row-size=6B cardinality=2
 |
 |--06:EXCHANGE [UNPARTITIONED]
 |  |
 |  02:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 03:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: a = a
 |  row-size=4B cardinality=2
 |
 |--05:EXCHANGE [UNPARTITIONED]
 |  |
 |  01:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 00:UNION
    constant-operands=2
    row-size=2B cardinality=2
 ====
 # Semi and inner join on a table and on inline views made up of constant selects
 select * from functional.alltypessmall x
 left semi join
 (select 1 a, 3 b union all select 1 a, 3 b) y on y.a = x.id
 inner join
 (select 1 a, 3 b union all select 1 a, 3 b) z on z.b = x.id + 2
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: x.id + 2 = b
 |  runtime filters: RF000 <- b
 |  row-size=91B cardinality=2
 |
 |--02:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 03:HASH JOIN [LEFT SEMI JOIN]
 |  hash predicates: x.id = a
 |  runtime filters: RF002 <- a
 |  row-size=89B cardinality=2
 |
 |--01:UNION
 |     constant-operands=2
 |     row-size=1B cardinality=2
 |
 00:SCAN HDFS [functional.alltypessmall x]
    partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> x.id + 2, RF002 -> x.id
    row-size=89B cardinality=100
 ---- DISTRIBUTEDPLAN
 PLAN-ROOT SINK
 |
 07:EXCHANGE [UNPARTITIONED]
 |
 04:HASH JOIN [INNER JOIN, BROADCAST]
 |  hash predicates: x.id + 2 = b
 |  runtime filters: RF000 <- b
 |  row-size=91B cardinality=2
 |
 |--06:EXCHANGE [BROADCAST]
 |  |
 |  02:UNION
 |     constant-operands=2
 |     row-size=2B cardinality=2
 |
 03:HASH JOIN [LEFT SEMI JOIN, BROADCAST]
 |  hash predicates: x.id = a
 |  runtime filters: RF002 <- a
 |  row-size=89B cardinality=2
 |
 |--05:EXCHANGE [BROADCAST]
 |  |
 |  01:UNION
 |     constant-operands=2
 |     row-size=1B cardinality=2
 |
 00:SCAN HDFS [functional.alltypessmall x]
    partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> x.id + 2, RF002 -> x.id
    row-size=89B cardinality=100
 ====
 # Tests that views correctly reanalyze cloned exprs. (IMPALA-984)
 select b.* from functional.decimal_tbl a left outer join
   (select d1, d1 + NULL IS NULL x from functional.decimal_tbl) b
 on (a.d1 = b.d1)
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.d1 = d1
 |  row-size=8B cardinality=unavailable
 |
 |--01:SCAN HDFS [functional.decimal_tbl]
 |     partitions=1/1 files=1 size=195B
 |     row-size=4B cardinality=unavailable
 |
 00:SCAN HDFS [functional.decimal_tbl a]
    partitions=1/1 files=1 size=195B
    row-size=4B cardinality=unavailable
 ====
 # Test predicate assignment through inline view when the query contains
 # group by and distinct (IMPALA-1165)
 select foo, sum(distinct foo)
 from (select int_col + int_col as foo from functional.alltypesagg) t
 where foo = 10
 group by foo
 limit 10
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:AGGREGATE [FINALIZE]
 |  output: sum(foo)
 |  group by: foo
 |  limit: 10
 |  row-size=16B cardinality=10
 |
 01:AGGREGATE
 |  group by: int_col + int_col, int_col + int_col
 |  row-size=16B cardinality=11
 |
 00:SCAN HDFS [functional.alltypesagg]
    partitions=11/11 files=11 size=814.73KB
    predicates: int_col + int_col = 10
    row-size=4B cardinality=11
 ====
 # Test enforcement of inline-view slot equivalences when the inline-view
 # contains an outer join (IMPALA-1441)
 select * from
   (select t1.int_col, t1.tinyint_col, t2.int_col as int_col2, t2.tinyint_col as tinyint_col2
    from functional.alltypestiny t1 left outer join functional.alltypes t2
    on t1.int_col = t2.int_col and t1.tinyint_col = t2.tinyint_col) t
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: t2.int_col = t1.int_col, t2.tinyint_col = t1.tinyint_col
 |  runtime filters: RF000 <- t1.int_col, RF001 <- t1.tinyint_col
 |  row-size=10B cardinality=5.84K
 |
 |--00:SCAN HDFS [functional.alltypestiny t1]
 |     partitions=4/4 files=4 size=460B
 |     row-size=5B cardinality=8
 |
 01:SCAN HDFS [functional.alltypes t2]
    partitions=24/24 files=24 size=478.45KB
    runtime filters: RF000 -> t2.int_col, RF001 -> t2.tinyint_col
    row-size=5B cardinality=7.30K
 ====
 # IMPALA-1459: Test correct assignment of On-clause predicate from an enclosing block
 # inside an inline view with an outer join.
 select 1 from
   (select a.id aid, b.id bid from
    functional.alltypes a inner join functional.alltypes b
    on a.id = b.id
    full outer join functional.alltypessmall c on a.id = c.id) v
 inner join functional.alltypestiny c
 on (aid < bid and aid = c.id)
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:HASH JOIN [INNER JOIN]
 |  hash predicates: a.id = c.id
 |  runtime filters: RF000 <- c.id
 |  row-size=16B cardinality=9
 |
 |--05:SCAN HDFS [functional.alltypestiny c]
 |     partitions=4/4 files=4 size=460B
 |     row-size=4B cardinality=8
 |
 04:HASH JOIN [FULL OUTER JOIN]
 |  hash predicates: a.id = c.id
 |  other predicates: a.id < b.id
 |  row-size=12B cardinality=7.40K
 |
 |--02:SCAN HDFS [functional.alltypessmall c]
 |     partitions=4/4 files=4 size=6.32KB
 |     row-size=4B cardinality=100
 |
 03:HASH JOIN [INNER JOIN]
 |  hash predicates: a.id = b.id
 |  runtime filters: RF002 <- b.id
 |  row-size=8B cardinality=7.30K
 |
 |--01:SCAN HDFS [functional.alltypes b]
 |     partitions=24/24 files=24 size=478.45KB
 |     runtime filters: RF000 -> b.id
 |     row-size=4B cardinality=7.30K
 |
 00:SCAN HDFS [functional.alltypes a]
    partitions=24/24 files=24 size=478.45KB
    runtime filters: RF000 -> a.id, RF002 -> a.id
    row-size=4B cardinality=7.30K
 ====
 # IMPALA-2665: Test correct assignment of On-clause predicate from an enclosing block
 # inside an inline view with an outer join.
 select 1 from functional.alltypes t1
 inner join
   (select a.id, b.int_col
    from functional.alltypes a left outer join functional.alltypes b
    on a.id = b.int_col) v
 on (t1.id = v.id and v.int_col is null and v.int_col < 10 and v.id < 10)
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: a.id = t1.id
 |  runtime filters: RF000 <- t1.id
 |  row-size=12B cardinality=73
 |
 |--00:SCAN HDFS [functional.alltypes t1]
 |     partitions=24/24 files=24 size=478.45KB
 |     predicates: t1.id < 10
 |     row-size=4B cardinality=730
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.id = b.int_col
 |  other predicates: b.int_col IS NULL, b.int_col < 10
 |  row-size=8B cardinality=730
 |
 |--02:SCAN HDFS [functional.alltypes b]
 |     partitions=24/24 files=24 size=478.45KB
 |     predicates: b.int_col < 10
 |     runtime filters: RF000 -> b.int_col
 |     row-size=4B cardinality=730
 |
 01:SCAN HDFS [functional.alltypes a]
    partitions=24/24 files=24 size=478.45KB
    predicates: a.id < 10
    runtime filters: RF000 -> a.id
    row-size=4B cardinality=730
 ====
 # IMPALA-2643: Test inline views with duplicate exprs in their select list.
 # Inferred predicate referencing the same expr gets filtered out.
 select * from
   (select * from
     (select bigint_col, bigint_col as bigint_col2
      from functional.alltypestiny) iv
   ) ivv
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:SCAN HDFS [functional.alltypestiny]
    partitions=4/4 files=4 size=460B
    row-size=8B cardinality=8
 ====
 # IMPALA-2643: Explicit predicates remain unafftected.
 select * from
   (select * from
     (select bigint_col, bigint_col as bigint_col2
      from functional.alltypestiny) iv
   ) ivv where bigint_col = bigint_col2
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:SCAN HDFS [functional.alltypestiny]
    partitions=4/4 files=4 size=460B
    predicates: bigint_col = bigint_col
    row-size=8B cardinality=1
 ====
 # IMPALA-2643: Test aggregation.
 # Inferred predicate referencing the same expr gets filtered out.
 select * from
   (select * from
     (select sum(bigint_col) as s1, sum(bigint_col) as s2
      from functional.alltypestiny) iv
   ) ivv
 ---- PLAN
 PLAN-ROOT SINK
 |
 01:AGGREGATE [FINALIZE]
 |  output: sum(bigint_col)
 |  row-size=8B cardinality=1
 |
 00:SCAN HDFS [functional.alltypestiny]
    partitions=4/4 files=4 size=460B
    row-size=8B cardinality=8
 ====
 # IMPALA-2643: Explicit predicates remain unafftected.
 select * from
   (select * from
     (select sum(bigint_col) as s1, sum(bigint_col) as s2
      from functional.alltypestiny) iv
   ) ivv where s1 = s2
 ---- PLAN
 PLAN-ROOT SINK
 |
 01:AGGREGATE [FINALIZE]
 |  output: sum(bigint_col)
 |  having: sum(bigint_col) = sum(bigint_col)
 |  row-size=8B cardinality=0
 |
 00:SCAN HDFS [functional.alltypestiny]
    partitions=4/4 files=4 size=460B
    row-size=8B cardinality=8
 ====
 # IMPALA-8386: Predicates generated from slot equivalences won't be identities.
 # Without this patch, there will be a predicate "sum(c.int_col) = sum(c.int_col)"
 # in node 05, which may incorrectly reject rows with nulls.
 select count(1) from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypes a
     left outer join (
         select c.bigint_col, sum(c.int_col) as amount1, sum(c.int_col) as amount2
         from functional.alltypessmall b
         join functional.alltypestiny c
         on b.bigint_col = c.bigint_col
         group by c.bigint_col
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:AGGREGATE [FINALIZE]
 |  output: count(*)
 |  row-size=8B cardinality=1
 |
 05:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = c.bigint_col
 |  row-size=16B cardinality=7.30K
 |
 |--04:AGGREGATE [FINALIZE]
 |  |  group by: c.bigint_col
 |  |  row-size=8B cardinality=2
 |  |
 |  03:HASH JOIN [INNER JOIN]
 |  |  hash predicates: b.bigint_col = c.bigint_col
 |  |  runtime filters: RF000 <- c.bigint_col
 |  |  row-size=16B cardinality=80
 |  |
 |  |--02:SCAN HDFS [functional.alltypestiny c]
 |  |     partitions=4/4 files=4 size=460B
 |  |     row-size=8B cardinality=8
 |  |
 |  01:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     runtime filters: RF000 -> b.bigint_col
 |     row-size=8B cardinality=100
 |
 00:SCAN HDFS [functional.alltypes a]
    partitions=24/24 files=24 size=478.45KB
    row-size=8B cardinality=7.30K
 ====
 # IMPALA-8386: Predicates generated from slot equivalences won't be identities.
 # Without this patch, there will be a predicate "c.int_col = c.int_col" in node 04,
 # which may incorrectly reject rows with nulls.
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypes a
     left outer join (
         select c.bigint_col, c.int_col as amount1, c.int_col as amount2
         from functional.alltypessmall b
         join functional.alltypestiny c
         on b.bigint_col = c.bigint_col
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = c.bigint_col
 |  row-size=28B cardinality=58.40K
 |
 |--03:HASH JOIN [INNER JOIN]
 |  |  hash predicates: b.bigint_col = c.bigint_col
 |  |  runtime filters: RF000 <- c.bigint_col
 |  |  row-size=20B cardinality=80
 |  |
 |  |--02:SCAN HDFS [functional.alltypestiny c]
 |  |     partitions=4/4 files=4 size=460B
 |  |     row-size=12B cardinality=8
 |  |
 |  01:SCAN HDFS [functional.alltypessmall b]
 |     partitions=4/4 files=4 size=6.32KB
 |     runtime filters: RF000 -> b.bigint_col
 |     row-size=8B cardinality=100
 |
 00:SCAN HDFS [functional.alltypes a]
    partitions=24/24 files=24 size=478.45KB
    row-size=8B cardinality=7.30K
 ====
 # A more deeper inline view test for IMPALA-8386. No predicate "int_col = int_col" will
 # be generated.
 select * from (
     select t2.id, t2.amount1, t2.amount2
     from functional.alltypestiny a
     left outer join (
         select t3.id, t3.amount1, t3.amount2
         from functional.alltypestiny b
         left outer join (
             select c.id, c.int_col as amount1, c.int_col as amount2
             from functional.alltypestiny c
             join functional.alltypestiny d
             on c.id = d.id
         ) t3
         on b.id = t3.id
     ) t2
     on a.id = t2.id
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: c.id = a.id
 |  runtime filters: RF000 <- a.id
 |  row-size=20B cardinality=8
 |
 |--00:SCAN HDFS [functional.alltypestiny a]
 |     partitions=4/4 files=4 size=460B
 |     row-size=4B cardinality=8
 |
 05:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: c.id = b.id
 |  runtime filters: RF002 <- b.id
 |  row-size=16B cardinality=8
 |
 |--01:SCAN HDFS [functional.alltypestiny b]
 |     partitions=4/4 files=4 size=460B
 |     row-size=4B cardinality=8
 |
 04:HASH JOIN [INNER JOIN]
 |  hash predicates: c.id = d.id
 |  runtime filters: RF004 <- d.id
 |  row-size=12B cardinality=8
 |
 |--03:SCAN HDFS [functional.alltypestiny d]
 |     partitions=4/4 files=4 size=460B
 |     runtime filters: RF000 -> d.id, RF002 -> d.id
 |     row-size=4B cardinality=8
 |
 02:SCAN HDFS [functional.alltypestiny c]
    partitions=4/4 files=4 size=460B
    runtime filters: RF000 -> c.id, RF002 -> c.id, RF004 -> c.id
    row-size=8B cardinality=8
 ====
 # A minimal reproduce for IMPALA-8386. Though the query results are correct, without
 # this patch there's a wrong inferred predicate "int_col = int_col" assigned at the
 # Join node.
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypessmall a
     left outer join (
         select bigint_col, int_col as amount1, int_col as amount2
         from functional.alltypestiny
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 02:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = bigint_col
 |  row-size=20B cardinality=100
 |
 |--01:SCAN HDFS [functional.alltypestiny]
 |     partitions=4/4 files=4 size=460B
 |     row-size=12B cardinality=8
 |
 00:SCAN HDFS [functional.alltypessmall a]
    partitions=4/4 files=4 size=6.32KB
    row-size=8B cardinality=100
 ====
 # IMPALA-8386: test coverage for ORDER BY/LIMIT
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypessmall a
     left outer join (
         select bigint_col, int_col as amount1, int_col as amount2
         from functional.alltypestiny
         order by bigint_col limit 10
     ) t2
     on a.bigint_col = t2.bigint_col
     order by 1 limit 10
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:TOP-N [LIMIT=10]
 |  order by: bigint_col ASC
 |  row-size=16B cardinality=10
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = bigint_col
 |  row-size=20B cardinality=100
 |
 |--02:TOP-N [LIMIT=10]
 |  |  order by: bigint_col ASC
 |  |  row-size=12B cardinality=8
 |  |
 |  01:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     row-size=12B cardinality=8
 |
 00:SCAN HDFS [functional.alltypessmall a]
    HDFS partitions=4/4 files=4 size=6.32KB
    row-size=8B cardinality=100
 ====
 # IMPALA-8386: test coverage for analytic functions
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypessmall a
     left outer join (
         select bigint_col, max(int_col) over (partition by bigint_col) as amount1,
             max(int_col) over (partition by bigint_col) as amount2
         from functional.alltypestiny
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = bigint_col
 |  row-size=24B cardinality=100
 |
 |--03:ANALYTIC
 |  |  functions: max(int_col)
 |  |  partition by: bigint_col
 |  |  row-size=16B cardinality=8
 |  |
 |  02:SORT
 |  |  order by: bigint_col ASC NULLS FIRST
 |  |  row-size=12B cardinality=8
 |  |
 |  01:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     row-size=12B cardinality=8
 |
 00:SCAN HDFS [functional.alltypessmall a]
    HDFS partitions=4/4 files=4 size=6.32KB
    row-size=8B cardinality=100
 ====
 # IMPALA-8386: test coverage for unions
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypessmall a
     left outer join (
         select bigint_col, int_col as amount1, int_col as amount2
         from (
             select * from functional.alltypestiny where id < 4
             union all
             select * from functional.alltypestiny where id >= 4
         ) t3
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = bigint_col
 |  row-size=20B cardinality=100
 |
 |--01:UNION
 |  |  row-size=12B cardinality=2
 |  |
 |  |--03:SCAN HDFS [functional.alltypestiny]
 |  |     HDFS partitions=4/4 files=4 size=460B
 |  |     predicates: id >= 4
 |  |     row-size=16B cardinality=1
 |  |
 |  02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: id < 4
 |     row-size=16B cardinality=1
 |
 00:SCAN HDFS [functional.alltypessmall a]
    HDFS partitions=4/4 files=4 size=6.32KB
    row-size=8B cardinality=100
 ====
 # IMPALA-8386: test coverage for unions
 select * from (
     select t2.bigint_col, t2.amount1, t2.amount2
     from functional.alltypessmall a
     left join (
         select bigint_col, int_col as amount1, int_col as amount2
         from functional.alltypestiny
         union all values (NULL, NULL, NULL)
     ) t2
     on a.bigint_col = t2.bigint_col
 ) t1;
 ---- PLAN
 PLAN-ROOT SINK
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: a.bigint_col = bigint_col
 |  row-size=24B cardinality=100
 |
 |--01:UNION
 |  |  constant-operands=1
 |  |  row-size=16B cardinality=9
 |  |
 |  02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     row-size=12B cardinality=8
 |
 00:SCAN HDFS [functional.alltypessmall a]
    HDFS partitions=4/4 files=4 size=6.32KB
    row-size=8B cardinality=100
 ====
 # IMPALA-7957: Slot equivalences should not be enforced multiple times.
 # Without this patch, the planner will incorrectly generated a SELECT node with a wrong
 # predicate "functional.alltypestiny.id = functional.alltypestiny.int_col" on top of the
 # JOIN node. So LEFT JOIN results with NULL values will be incorrectly rejects.
 SELECT t.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
    FROM functional.alltypestiny
    WHERE int_col = id) t2
 ON (t.id = t2.id)
 UNION ALL
 VALUES (NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=4B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  row-size=12B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # IMPALA-7957: Slot equivalences should not be enforced multiple times.
 # Coverage for UNION DISTINCT
 SELECT t.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
   FROM functional.alltypestiny
   WHERE int_col = id) t2
 ON (t.id = t2.id)
 UNION DISTINCT
 VALUES (NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 04:AGGREGATE [FINALIZE]
 |  group by: id
 |  row-size=4B cardinality=9
 |
 00:UNION
 |  constant-operands=1
 |  row-size=4B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  row-size=12B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # IMPALA-7957: Slot equivalences should not be enforced multiple times.
 # The WHERE predicate "t.int_col = t.id" is pushed down to the scan node of t.
 SELECT t.id, t.int_col
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
   FROM functional.alltypestiny) t2
 ON (t.id = t2.id)
 WHERE t.int_col = t.id
 UNION ALL
 VALUES (NULL, NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=1
 |
 03:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: id = t.id
 |  runtime filters: RF000 <- t.id
 |  row-size=12B cardinality=1
 |
 |--01:SCAN HDFS [functional.alltypestiny t]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: t.int_col = t.id
 |     row-size=8B cardinality=1
 |
 02:SCAN HDFS [functional.alltypestiny]
    HDFS partitions=4/4 files=4 size=460B
    runtime filters: RF000 -> id
    row-size=4B cardinality=8
 ====
 # Regression test for IMPALA-7957. Comparing to the test above, this test changes the
 # WHERE clause to target on the rhs of the LEFT JOIN. The WHERE predicate is correctly
 # duplicated and pushed down to the SCAN node.
 SELECT t2.id, t2.int_col
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
   FROM functional.alltypestiny) t2
 ON (t.id = t2.id)
 WHERE t2.int_col = t2.id
 UNION ALL
 VALUES (NULL, NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  other predicates: int_col = id
 |  row-size=12B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: functional.alltypestiny.int_col = functional.alltypestiny.id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # Regression test for IMPALA-7957. The inline view t2 has a ORDER BY LIMIT clause.
 # No behavior changes after the patch.
 SELECT t2.id, t2.int_col
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
   FROM functional.alltypestiny
   ORDER BY id LIMIT 2) t2
 ON (t.id = t2.id)
 WHERE t2.int_col = t2.id
 UNION ALL
 VALUES (NULL, NULL);
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=9
 |
 05:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  other predicates: int_col = id
 |  row-size=12B cardinality=8
 |
 |--04:SELECT
 |  |  predicates: id = int_col
 |  |  row-size=8B cardinality=0
 |  |
 |  03:TOP-N [LIMIT=2]
 |  |  order by: id ASC
 |  |  row-size=8B cardinality=2
 |  |
 |  02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     row-size=8B cardinality=8
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # Regression test for IMPALA-7957. The inline view t2 has an analytic function.
 # No behavior changes after the patch.
 SELECT t2.id, t2.int_col
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col, count(int_col) over (partition by int_col) int_sum
   FROM functional.alltypestiny
   ORDER BY id LIMIT 2) t2
 ON (t.id = t2.id)
 WHERE t2.int_col = t2.id
 UNION ALL
 VALUES (NULL, NULL);
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=9
 |
 05:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  other predicates: int_col = id
 |  row-size=12B cardinality=8
 |
 |--04:SELECT
 |  |  predicates: id = int_col
 |  |  row-size=8B cardinality=0
 |  |
 |  03:TOP-N [LIMIT=2]
 |  |  order by: id ASC
 |  |  row-size=8B cardinality=2
 |  |
 |  02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     row-size=8B cardinality=8
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # Regression test for IMPALA-7957. The first union operand has an ORDER BY LIMIT clause.
 SELECT t.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
    FROM functional.alltypestiny
    WHERE int_col = id) t2
 ON (t.id = t2.id)
 ORDER BY 1 LIMIT 3
 UNION ALL
 VALUES (NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  pass-through-operands: all
 |  row-size=4B cardinality=4
 |
 04:TOP-N [LIMIT=3]
 |  order by: id ASC
 |  row-size=4B cardinality=3
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  row-size=12B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # Regression test for IMPALA-7957. The first union operand has a GROUP BY clause.
 SELECT t.id, sum(t.int_col)
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
    FROM functional.alltypestiny
    WHERE int_col = id) t2
 ON (t.id = t2.id)
 GROUP BY 1
 UNION ALL
 VALUES (NULL, NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  pass-through-operands: all
 |  row-size=12B cardinality=9
 |
 04:AGGREGATE [FINALIZE]
 |  output: sum(t.int_col)
 |  group by: t.id
 |  row-size=12B cardinality=8
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  row-size=16B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=8B cardinality=8
 ====
 # IMPALA-7957: Add the same predicate *outside* the left join, it should still be enforced.
 SELECT t.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col
   FROM functional.alltypestiny
   WHERE int_col = id) t2
 ON (t.id = t2.id) where t2.id = t2.int_col
 UNION ALL
 VALUES (NULL);
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=4B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  other predicates: id = int_col
 |  row-size=12B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id
 |     row-size=8B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # IMPALA-7957: Same thing except with a predicate on a different column (i.e. adding it
 # to the equivalence class)
 SELECT t.id, t2.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col, smallint_col
   FROM functional.alltypestiny
   WHERE int_col = id) t2
 ON (t.id = t2.id) where t2.int_col = t2.smallint_col
 UNION ALL
 VALUES (NULL, NULL)
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  other predicates: int_col = smallint_col
 |  row-size=14B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id, id = smallint_col
 |     row-size=10B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # IMPALA-7957: Multiple predicates that must not be placed above the join
 SELECT t.id, t2.id
 FROM functional.alltypestiny t
 LEFT JOIN
   (SELECT id, int_col, smallint_col
   FROM functional.alltypestiny
   WHERE int_col = id and smallint_col = id and tinyint_col = id) t2
 ON (t.id = t2.id)
 UNION ALL
 VALUES (NULL, NULL);
 ---- PLAN
 PLAN-ROOT SINK
 |
 00:UNION
 |  constant-operands=1
 |  row-size=8B cardinality=9
 |
 03:HASH JOIN [LEFT OUTER JOIN]
 |  hash predicates: t.id = id
 |  row-size=15B cardinality=8
 |
 |--02:SCAN HDFS [functional.alltypestiny]
 |     HDFS partitions=4/4 files=4 size=460B
 |     predicates: int_col = id, smallint_col = id, tinyint_col = id
 |     row-size=11B cardinality=1
 |
 01:SCAN HDFS [functional.alltypestiny t]
    HDFS partitions=4/4 files=4 size=460B
    row-size=4B cardinality=8
 ====
 # IMPALA-9162: Should not add extra predicates to the WHERE part of a left outer join
 select x.* from (select v1.c2, v1.max_c2 from functional.alltypessmall t
   left join (
    with iv1 AS (SELECT smallint_col c1, bigint_col c2
                  FROM functional.alltypessmall
                 group by c1, c2),
         iv2 AS (SELECT smallint_col r_c1, max(bigint_col) max_c2
                  FROM functional.alltypessmall
                 group by r_c1)
     select iv1.c2, iv2.max_c2 FROM iv1, iv2 where iv1.c2 = iv2.max_c2) as v1
   on t.smallint_col=v1.c2) as x;
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:HASH JOIN [RIGHT OUTER JOIN]
 |  hash predicates: bigint_col = t.smallint_col
 |  runtime filters: RF000 <- t.smallint_col
 |  row-size=22B cardinality=81
 |
 |--00:SCAN HDFS [functional.alltypessmall t]
 |     HDFS partitions=4/4 files=4 size=6.32KB
 |     row-size=2B cardinality=81
 |
 05:HASH JOIN [INNER JOIN]
 |  hash predicates: bigint_col = max(bigint_col)
 |  runtime filters: RF002 <- max(bigint_col)
 |  row-size=20B cardinality=81
 |
 |--04:AGGREGATE [FINALIZE]
 |  |  output: max(bigint_col)
 |  |  group by: smallint_col
 |  |  row-size=10B cardinality=81
 |  |
 |  03:SCAN HDFS [functional.alltypessmall]
 |     HDFS partitions=4/4 files=4 size=6.32KB
 |     row-size=10B cardinality=81
 |
 02:AGGREGATE [FINALIZE]
 |  group by: smallint_col, bigint_col
 |  row-size=10B cardinality=81
 |
 01:SCAN HDFS [functional.alltypessmall]
    HDFS partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> functional.alltypessmall.bigint_col, RF002 -> functional.alltypessmall.bigint_col
    row-size=10B cardinality=81
 ====
 # IMPALA-9162: Should not add extra predicates to the WHERE part of a full outer join
 select x.* from (select v1.c2, v1.max_c2 from functional.alltypessmall t
    full outer join (
    with iv1 AS (SELECT smallint_col c1, bigint_col c2
                  FROM functional.alltypessmall
                 group by c1, c2),
         iv2 AS (SELECT smallint_col r_c1, max(bigint_col) max_c2
                  FROM functional.alltypessmall
                 group by r_c1)
     select iv1.c2, iv2.max_c2 FROM iv1, iv2 where iv1.c2 = iv2.max_c2) as v1
   on t.smallint_col=v1.c2) as x;
 ---- PLAN
 PLAN-ROOT SINK
 |
 06:HASH JOIN [FULL OUTER JOIN]
 |  hash predicates: bigint_col = t.smallint_col
 |  row-size=22B cardinality=81
 |
 |--00:SCAN HDFS [functional.alltypessmall t]
 |     HDFS partitions=4/4 files=4 size=6.32KB
 |     row-size=2B cardinality=81
 |
 05:HASH JOIN [INNER JOIN]
 |  hash predicates: bigint_col = max(bigint_col)
 |  runtime filters: RF000 <- max(bigint_col)
 |  row-size=20B cardinality=81
 |
 |--04:AGGREGATE [FINALIZE]
 |  |  output: max(bigint_col)
 |  |  group by: smallint_col
 |  |  row-size=10B cardinality=81
 |  |
 |  03:SCAN HDFS [functional.alltypessmall]
 |     HDFS partitions=4/4 files=4 size=6.32KB
 |     row-size=10B cardinality=81
 |
 02:AGGREGATE [FINALIZE]
 |  group by: smallint_col, bigint_col
 |  row-size=10B cardinality=81
 |
 01:SCAN HDFS [functional.alltypessmall]
    HDFS partitions=4/4 files=4 size=6.32KB
    runtime filters: RF000 -> functional.alltypessmall.bigint_col
    row-size=10B cardinality=81
 ====