src/test/regress/sql/goh_subselect.sql - hawq - Git at Google

 --
 -- SUBSELECT
 --
 \c hdfs

 SELECT 1 AS one WHERE 1 IN (SELECT 1);

 SELECT 1 AS zero WHERE 1 NOT IN (SELECT 1);

 SELECT 1 AS zero WHERE 1 IN (SELECT 2);

 -- Set up some simple test tables

 CREATE TABLE SUBSELECT_TBL (
   f1 integer,
   f2 integer,
   f3 float
 );

 INSERT INTO SUBSELECT_TBL VALUES (1, 2, 3);
 INSERT INTO SUBSELECT_TBL VALUES (2, 3, 4);
 INSERT INTO SUBSELECT_TBL VALUES (3, 4, 5);
 INSERT INTO SUBSELECT_TBL VALUES (1, 1, 1);
 INSERT INTO SUBSELECT_TBL VALUES (2, 2, 2);
 INSERT INTO SUBSELECT_TBL VALUES (3, 3, 3);
 INSERT INTO SUBSELECT_TBL VALUES (6, 7, 8);
 INSERT INTO SUBSELECT_TBL VALUES (8, 9, NULL);

 SELECT '' AS eight, * FROM SUBSELECT_TBL ORDER BY 2,3,4;

 -- Uncorrelated subselects

 SELECT '' AS two, f1 AS "Constant Select" FROM SUBSELECT_TBL
   WHERE f1 IN (SELECT 1) ORDER BY 2;

 SELECT '' AS six, f1 AS "Uncorrelated Field" FROM SUBSELECT_TBL
   WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL) ORDER BY 2;

 SELECT '' AS six, f1 AS "Uncorrelated Field" FROM SUBSELECT_TBL
   WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL WHERE
     f2 IN (SELECT f1 FROM SUBSELECT_TBL)) ORDER BY 2;

 SELECT '' AS three, f1, f2
   FROM SUBSELECT_TBL
   WHERE (f1, f2) NOT IN (SELECT f2, CAST(f3 AS int4) FROM SUBSELECT_TBL
                          WHERE f3 IS NOT NULL) ORDER BY 2,3;

 -- Correlated subselects

 SELECT '' AS six, f1 AS "Correlated Field", f2 AS "Second Field"
   FROM SUBSELECT_TBL upper
   WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL WHERE f1 = upper.f1) ORDER BY 2,3;

 SELECT '' AS six, f1 AS "Correlated Field", f3 AS "Second Field"
   FROM SUBSELECT_TBL upper
   WHERE f1 IN
     (SELECT f2 FROM SUBSELECT_TBL WHERE CAST(upper.f2 AS float) = f3) ORDER BY 2,3;

 SELECT '' AS six, f1 AS "Correlated Field", f3 AS "Second Field"
   FROM SUBSELECT_TBL upper
   WHERE f3 IN (SELECT upper.f1 + f2 FROM SUBSELECT_TBL
                WHERE f2 = CAST(f3 AS integer)) ORDER BY 2,3;

 SELECT '' AS five, f1 AS "Correlated Field"
   FROM SUBSELECT_TBL
   WHERE (f1, f2) IN (SELECT f2, CAST(f3 AS int4) FROM SUBSELECT_TBL
                      WHERE f3 IS NOT NULL) ORDER BY 2;

 --
 -- Use some existing tables in the regression test
 --

 SELECT '' AS eight, ss.f1 AS "Correlated Field", ss.f3 AS "Second Field"
   FROM SUBSELECT_TBL ss
   WHERE f1 NOT IN (SELECT f1+1 FROM INT4_TBL
                    WHERE f1 != ss.f1 AND f1 < 2147483647) ORDER BY 2,3;

 select q1, float8(count(*)) / (select count(*) from int8_tbl)
 from int8_tbl group by q1 order by q1;

 --
 -- Test cases to catch unpleasant interactions between IN-join processing
 -- and subquery pullup.
 --

 select count(*) from
   (select 1 from tenk1 a
    where unique1 IN (select hundred from tenk1 b)) ss;
 select count(distinct ss.ten) from
   (select ten from tenk1 a
    where unique1 IN (select hundred from tenk1 b)) ss;
 select count(*) from
   (select 1 from tenk1 a
    where unique1 IN (select distinct hundred from tenk1 b)) ss;
 select count(distinct ss.ten) from
   (select ten from tenk1 a
    where unique1 IN (select distinct hundred from tenk1 b)) ss;

 --
 -- Test cases to check for overenthusiastic optimization of
 -- "IN (SELECT DISTINCT ...)" and related cases.  Per example from
 -- Luca Pireddu and Michael Fuhr.
 --

 CREATE TEMP TABLE foo (id integer);
 CREATE TEMP TABLE bar (id1 integer, id2 integer);

 INSERT INTO foo VALUES (1);

 INSERT INTO bar VALUES (1, 1);
 INSERT INTO bar VALUES (2, 2);
 INSERT INTO bar VALUES (3, 1);

 -- These cases require an extra level of distinct-ing above subquery s
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT DISTINCT id1, id2 FROM bar) AS s) ORDER BY 1;
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT id1,id2 FROM bar GROUP BY id1,id2) AS s) ORDER BY 1;
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT id1, id2 FROM bar UNION
                       SELECT id1, id2 FROM bar) AS s) ORDER BY 1;

 -- These cases do not
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT DISTINCT ON (id2) id1, id2 FROM bar) AS s) ORDER BY 1;
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT id2 FROM bar GROUP BY id2) AS s) ORDER BY 1;
 SELECT * FROM foo WHERE id IN
     (SELECT id2 FROM (SELECT id2 FROM bar UNION
                       SELECT id2 FROM bar) AS s) ORDER BY 1;

 --
 -- Test case to catch problems with multiply nested sub-SELECTs not getting
 -- recalculated properly.  Per bug report from Didier Moens.
 --

 CREATE TABLE orderstest (
     approver_ref integer,
     po_ref integer,
     ordercancelled boolean
 );

 INSERT INTO orderstest VALUES (1, 1, false);
 INSERT INTO orderstest VALUES (66, 5, false);
 INSERT INTO orderstest VALUES (66, 6, false);
 INSERT INTO orderstest VALUES (66, 7, false);
 INSERT INTO orderstest VALUES (66, 1, true);
 INSERT INTO orderstest VALUES (66, 8, false);
 INSERT INTO orderstest VALUES (66, 1, false);
 INSERT INTO orderstest VALUES (77, 1, false);
 INSERT INTO orderstest VALUES (1, 1, false);
 INSERT INTO orderstest VALUES (66, 1, false);
 INSERT INTO orderstest VALUES (1, 1, false);

 CREATE VIEW orders_view AS
 SELECT *,
 (SELECT CASE
    WHEN ord.approver_ref=1 THEN '---' ELSE 'Approved'
  END) AS "Approved",
 (SELECT CASE
  WHEN ord.ordercancelled
  THEN 'Cancelled'
  ELSE
   (SELECT CASE
 		WHEN ord.po_ref=1
 		THEN
 		 (SELECT CASE
 				WHEN ord.approver_ref=1
 				THEN '---'
 				ELSE 'Approved'
 			END)
 		ELSE 'PO'
 	END)
 END) AS "Status",
 (CASE
  WHEN ord.ordercancelled
  THEN 'Cancelled'
  ELSE
   (CASE
 		WHEN ord.po_ref=1
 		THEN
 		 (CASE
 				WHEN ord.approver_ref=1
 				THEN '---'
 				ELSE 'Approved'
 			END)
 		ELSE 'PO'
 	END)
 END) AS "Status_OK"
 FROM orderstest ord;

 SELECT * FROM orders_view ORDER BY 1,2;

 DROP TABLE orderstest cascade;

 --
 -- Test cases to catch situations where rule rewriter fails to propagate
 -- hasSubLinks flag correctly.  Per example from Kyle Bateman.
 --

 create temp table parts (
     partnum     text,
     cost        float8
 );

 create temp table shipped (
     ttype       char(2),
     ordnum      int4,
     partnum     text,
     value       float8
 );

 create temp view shipped_view as
     select * from shipped where ttype = 'wt';

 create rule shipped_view_insert as on insert to shipped_view do instead
     insert into shipped values('wt', new.ordnum, new.partnum, new.value);

 insert into parts (partnum, cost) values (1, 1234.56);

 insert into shipped_view (ordnum, partnum, value)
     values (0, 1, (select cost from parts where partnum = 1));

 select * from shipped_view ORDER BY 1,2;

 create rule shipped_view_update as on update to shipped_view do instead
     update shipped set partnum = new.partnum, value = new.value
         where ttype = new.ttype and ordnum = new.ordnum;

 select * from shipped_view ORDER BY 1,2;

 select f1, ss1 as relabel from
     (select *, (select sum(f1) from int4_tbl b where f1 >= a.f1) as ss1
      from int4_tbl a) ss;

 --
 -- Test cases involving PARAM_EXEC parameters and min/max index optimizations.
 -- Per bug report from David Sanchez i Gregori.
 --

 select * from (
   select max(unique1) from tenk1 as a
   where exists (select 1 from tenk1 as b where b.thousand = a.unique2)
 ) ss;

 select * from (
   select min(unique1) from tenk1 as a
   where not exists (select 1 from tenk1 as b where b.unique2 = 10000)
 ) ss;

 --
 -- Base tables for CSQ tests
 --

 drop table if exists csq_t1_base;
 create table csq_t1_base(x int, y int) distributed by (x);

 insert into csq_t1_base values(1,2);
 insert into csq_t1_base values(2,1);
 insert into csq_t1_base values(4,2);

 drop table if exists csq_t2_base;
 create table csq_t2_base(x int, y int) distributed by (x);

 insert into csq_t2_base values(3,2);
 insert into csq_t2_base values(3,2);
 insert into csq_t2_base values(3,2);
 insert into csq_t2_base values(3,2);
 insert into csq_t2_base values(3,1);


 --
 -- Correlated subqueries
 --

 drop table if exists csq_t1;
 drop table if exists csq_t2;

 create table csq_t1(x int, y int) distributed by (x);
 create table csq_t2(x int, y int) distributed by (x);

 insert into csq_t1 select * from csq_t1_base;
 insert into csq_t2 select * from csq_t2_base;

 select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1; -- expected (4,2)

 --
 -- correlations in the targetlist
 --

 select csq_t1.x, (select sum(bar.x) from csq_t1 bar where bar.x >= csq_t1.x) as sum from csq_t1 order by csq_t1.x;

 select csq_t1.x, (select sum(bar.x) from csq_t1 bar where bar.x = csq_t1.x) as sum from csq_t1 order by csq_t1.x;

 select csq_t1.x, (select bar.x from csq_t1 bar where bar.x = csq_t1.x) as sum from csq_t1 order by csq_t1.x;

 --
 -- CSQs with partitioned tables
 --

 drop table if exists csq_t1;
 drop table if exists csq_t2;

 create table csq_t1(x int, y int)
 distributed by (x)
 partition by range (y) ( start (0) end (4) every (1))
 ;

 create table csq_t2(x int, y int)
 distributed by (x)
 partition by range (y) ( start (0) end (4) every (1))
 ;

 insert into csq_t1 select * from csq_t1_base;
 insert into csq_t2 select * from csq_t2_base;

 explain select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1;

 select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1; -- expected (4,2)

 drop table if exists csq_t1;
 drop table if exists csq_t2;
 drop table if exists csq_t1_base;
 drop table if exists csq_t2_base;

 --
 -- Multi-row subqueries
 --

 drop table if exists mrs_t1;
 create table mrs_t1(x int) distributed by (x);

 insert into mrs_t1 select generate_series(1,20);

 explain select * from mrs_t1 where exists (select x from mrs_t1 where x < -1);
 select * from mrs_t1 where exists (select x from mrs_t1 where x < -1) order by 1;

 explain select * from mrs_t1 where exists (select x from mrs_t1 where x = 1);
 select * from mrs_t1 where exists (select x from mrs_t1 where x = 1) order by 1;

 explain select * from mrs_t1 where x in (select x-95 from mrs_t1) or x < 5;
 select * from mrs_t1 where x in (select x-95 from mrs_t1) or x < 5 order by 1;

 explain select 1 as mrs_t1 where 1 <= ALL (Select x from mrs_t1);
 select 1 as mrs_t1 where 1 <= ALL (Select x from mrs_t1) order by 1;

 drop table if exists mrs_t1;

 --
 -- Multi-row subquery from MSTR
 --
 drop table if exists mrs_u1;
 drop table if exists mrs_u2;

 create TABLE mrs_u1 (a int, b int);
 create TABLE mrs_u2 (a int, b int);

 insert into mrs_u1 values (1,2),(11,22);
 insert into mrs_u2 values (1,2),(11,22),(33,44);

 select * from mrs_u1 join mrs_u2 on mrs_u1.a=mrs_u2.a where mrs_u1.a in (1,11) or mrs_u2.a in (select a from mrs_u1 where a=1) order by 1;

 drop table if exists mrs_u1;
 drop table if exists mrs_u2;

 --
 -- MPP-13758
 --

 drop table if exists csq_m1;
 create table csq_m1(y int);
 alter table csq_m1 add column x int default 0;
 insert into csq_m1 values(1,1);

 drop table if exists csq_d1;
 create table csq_d1(y int, x int) distributed by (x);
 insert into csq_d1 select * from csq_m1;

 explain select array(select x from csq_m1); -- no initplan
 select array(select x from csq_m1); -- {1}

 explain select array(select x from csq_d1); -- initplan
 select array(select x from csq_d1); -- {1}

 --
 -- CSQs involving master-only and distributed tables
 --

 drop table if exists t3coquicklz;

 create table t3coquicklz (c1 int , c2 varchar) with (appendonly=true, compresstype=quicklz, orientation=column) distributed by (c1);

 drop table if exists pg_attribute_storage;

 create table pg_attribute_storage (attrelid int, attnum int, attoptions text[]) distributed by (attrelid);

 insert into pg_attribute_storage values ('t3coquicklz'::regclass, 1, E'{\'something\'}');
 insert into pg_attribute_storage values ('t3coquicklz'::regclass, 2, E'{\'something2\'}');

 SELECT a.attname
 , pg_catalog.format_type(a.atttypid, a.atttypmod)

 , ( SELECT substring(pg_catalog.pg_get_expr(d.adbin, d.adrelid) for 128)
  FROM pg_catalog.pg_attrdef d
 WHERE d.adrelid = a.attrelid AND d.adnum = a.attnum AND a.atthasdef
 )
 , a.attnotnull
 , a.attnum
 , a.attstorage
 , pg_catalog.col_description(a.attrelid, a.attnum)
 , ( SELECT s.attoptions
 FROM pg_attribute_storage s
 WHERE s.attrelid = a.attrelid AND s.attnum = a.attnum
 ) newcolumn

 FROM pg_catalog.pg_attribute a
 WHERE a.attrelid = 't3coquicklz'::regclass AND a.attnum > 0 AND NOT a.attisdropped
 ORDER BY a.attnum
 ; -- expect to see 2 rows

 --
 -- More CSQs involving master-only and distributed relations
 --

 drop table if exists csq_m1;
 create table csq_m1(y int);
 alter table csq_m1 add column x int default 0;
 insert into csq_m1 values(1,1),(1,2),(1,3);

 drop table if exists csq_d1;
 create table csq_d1(y int, x int) distributed by (x);
 insert into csq_d1 select * from csq_m1 where x < 3;
 insert into csq_d1 values(1, 4);

 select * from csq_m1;
 select * from csq_d1;

 --
 -- outer plan node is master-only and CSQ has distributed relation
 --

 explain select * from csq_m1 where x not in (select x from csq_d1) or x < -100; -- gather motion
 select * from csq_m1 where x not in (select x from csq_d1) or x < -100; -- (3)

 --
 -- outer plan node is master-only and CSQ has distributed relation
 --

 explain select * from csq_d1 where x not in (select x from csq_m1) or x < -100; -- broadcast motion
 select * from csq_d1 where x not in (select x from csq_m1) or x < -100; -- (4)

 --
 -- MPP-14441 Don't lose track of initplans
 --
 drop table if exists csq_t1;
 CREATE TABLE csq_t1 (a int, b int, c int, d int, e text) DISTRIBUTED BY (a);
 INSERT INTO csq_t1 SELECT i, i/3, i%2, 100-i, 'text'||i  FROM generate_series(1,100) i;

 select count(*) from csq_t1 t1 where a > (SELECT x.b FROM ( select avg(a)::int as b,'haha'::text from csq_t1 t2 where t2.a=t1.d) x ) ;

 select count(*) from csq_t1 t1 where a > ( select avg(a)::int from csq_t1 t2 where t2.a=t1.d) ;

 --
 -- correlation in a func expr
 --
 CREATE FUNCTION csq_f(a int) RETURNS int AS $$ select $1 $$ LANGUAGE SQL;
 CREATE TABLE csq_r(a int);
 INSERT INTO csq_r VALUES (1);

 -- subqueries shouldn't be pulled into a join if the from clause has a function call
 -- with a correlated argument

 -- force_explain
 explain SELECT * FROM csq_r WHERE a IN (SELECT * FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE a IN (SELECT * FROM csq_f(csq_r.a));

 -- force_explain
 explain SELECT * FROM csq_r WHERE a not IN (SELECT * FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE a not IN (SELECT * FROM csq_f(csq_r.a));

 -- force_explain
 explain SELECT * FROM csq_r WHERE exists (SELECT * FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE exists (SELECT * FROM csq_f(csq_r.a));

 -- force_explain
 explain SELECT * FROM csq_r WHERE not exists (SELECT * FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE not exists (SELECT * FROM csq_f(csq_r.a));

 -- force_explain
 explain SELECT * FROM csq_r WHERE a > (SELECT csq_f FROM csq_f(csq_r.a) limit 1);

 SELECT * FROM csq_r WHERE a > (SELECT csq_f FROM csq_f(csq_r.a) limit 1);

 -- force_explain
 explain SELECT * FROM csq_r WHERE a < ANY (SELECT csq_f FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE a < ANY (SELECT csq_f FROM csq_f(csq_r.a));

 -- force_explain
 explain SELECT * FROM csq_r WHERE a <= ALL (SELECT csq_f FROM csq_f(csq_r.a));

 SELECT * FROM csq_r WHERE a <= ALL (SELECT csq_f FROM csq_f(csq_r.a));

 -- fails: correlation in distributed subplan
 -- force_explain
 explain SELECT * FROM csq_r WHERE a IN (SELECT csq_f FROM csq_f(csq_r.a),csq_r);

 --
 -- Test pullup of expr CSQs to joins
 --

 --
 -- Test data
 --

 drop table if exists csq_pullup;
 create table csq_pullup(t text, n numeric, i int, v varchar(10));
 insert into csq_pullup values ('abc',1, 2, 'xyz');
 insert into csq_pullup values ('xyz',2, 3, 'def');
 insert into csq_pullup values ('def',3, 1, 'abc');

 --
 -- Expr CSQs to joins
 --

 --
 -- text, text
 --

 explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.t);

 select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.t);

 --
 -- text, varchar
 --

 explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.v);

 select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.v);

 --
 -- numeric, numeric
 --

 explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n=t1.n);

 select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n=t1.n);

 --
 -- function(numeric), function(numeric)
 --

 explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.n + 1);

 select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.n + 1);


 --
 -- function(numeric), function(int)
 --

 explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.i + 1);

 select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.i + 1);


 --
 -- NOT EXISTS CSQs to joins
 --

 --
 -- text, text
 --

 explain select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.t=t1.t and t1.i = 1);

 select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.t=t1.t and t1.i = 1);

 --
 -- int, function(int)
 --

 explain select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.i=t1.i + 1);

 select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.i=t1.i + 1);
	--
	-- SUBSELECT
	--
	\c hdfs

	SELECT 1 AS one WHERE 1 IN (SELECT 1);

	SELECT 1 AS zero WHERE 1 NOT IN (SELECT 1);

	SELECT 1 AS zero WHERE 1 IN (SELECT 2);

	-- Set up some simple test tables

	CREATE TABLE SUBSELECT_TBL (
	f1 integer,
	f2 integer,
	f3 float
	);

	INSERT INTO SUBSELECT_TBL VALUES (1, 2, 3);
	INSERT INTO SUBSELECT_TBL VALUES (2, 3, 4);
	INSERT INTO SUBSELECT_TBL VALUES (3, 4, 5);
	INSERT INTO SUBSELECT_TBL VALUES (1, 1, 1);
	INSERT INTO SUBSELECT_TBL VALUES (2, 2, 2);
	INSERT INTO SUBSELECT_TBL VALUES (3, 3, 3);
	INSERT INTO SUBSELECT_TBL VALUES (6, 7, 8);
	INSERT INTO SUBSELECT_TBL VALUES (8, 9, NULL);

	SELECT '' AS eight, * FROM SUBSELECT_TBL ORDER BY 2,3,4;

	-- Uncorrelated subselects

	SELECT '' AS two, f1 AS "Constant Select" FROM SUBSELECT_TBL
	WHERE f1 IN (SELECT 1) ORDER BY 2;

	SELECT '' AS six, f1 AS "Uncorrelated Field" FROM SUBSELECT_TBL
	WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL) ORDER BY 2;

	SELECT '' AS six, f1 AS "Uncorrelated Field" FROM SUBSELECT_TBL
	WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL WHERE
	f2 IN (SELECT f1 FROM SUBSELECT_TBL)) ORDER BY 2;

	SELECT '' AS three, f1, f2
	FROM SUBSELECT_TBL
	WHERE (f1, f2) NOT IN (SELECT f2, CAST(f3 AS int4) FROM SUBSELECT_TBL
	WHERE f3 IS NOT NULL) ORDER BY 2,3;

	-- Correlated subselects

	SELECT '' AS six, f1 AS "Correlated Field", f2 AS "Second Field"
	FROM SUBSELECT_TBL upper
	WHERE f1 IN (SELECT f2 FROM SUBSELECT_TBL WHERE f1 = upper.f1) ORDER BY 2,3;

	SELECT '' AS six, f1 AS "Correlated Field", f3 AS "Second Field"
	FROM SUBSELECT_TBL upper
	WHERE f1 IN
	(SELECT f2 FROM SUBSELECT_TBL WHERE CAST(upper.f2 AS float) = f3) ORDER BY 2,3;

	SELECT '' AS six, f1 AS "Correlated Field", f3 AS "Second Field"
	FROM SUBSELECT_TBL upper
	WHERE f3 IN (SELECT upper.f1 + f2 FROM SUBSELECT_TBL
	WHERE f2 = CAST(f3 AS integer)) ORDER BY 2,3;

	SELECT '' AS five, f1 AS "Correlated Field"
	FROM SUBSELECT_TBL
	WHERE (f1, f2) IN (SELECT f2, CAST(f3 AS int4) FROM SUBSELECT_TBL
	WHERE f3 IS NOT NULL) ORDER BY 2;

	--
	-- Use some existing tables in the regression test
	--

	SELECT '' AS eight, ss.f1 AS "Correlated Field", ss.f3 AS "Second Field"
	FROM SUBSELECT_TBL ss
	WHERE f1 NOT IN (SELECT f1+1 FROM INT4_TBL
	WHERE f1 != ss.f1 AND f1 < 2147483647) ORDER BY 2,3;

	select q1, float8(count()) / (select count() from int8_tbl)
	from int8_tbl group by q1 order by q1;

	--
	-- Test cases to catch unpleasant interactions between IN-join processing
	-- and subquery pullup.
	--

	select count(*) from
	(select 1 from tenk1 a
	where unique1 IN (select hundred from tenk1 b)) ss;
	select count(distinct ss.ten) from
	(select ten from tenk1 a
	where unique1 IN (select hundred from tenk1 b)) ss;
	select count(*) from
	(select 1 from tenk1 a
	where unique1 IN (select distinct hundred from tenk1 b)) ss;
	select count(distinct ss.ten) from
	(select ten from tenk1 a
	where unique1 IN (select distinct hundred from tenk1 b)) ss;

	--
	-- Test cases to check for overenthusiastic optimization of
	-- "IN (SELECT DISTINCT ...)" and related cases. Per example from
	-- Luca Pireddu and Michael Fuhr.
	--

	CREATE TEMP TABLE foo (id integer);
	CREATE TEMP TABLE bar (id1 integer, id2 integer);

	INSERT INTO foo VALUES (1);

	INSERT INTO bar VALUES (1, 1);
	INSERT INTO bar VALUES (2, 2);
	INSERT INTO bar VALUES (3, 1);

	-- These cases require an extra level of distinct-ing above subquery s
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT DISTINCT id1, id2 FROM bar) AS s) ORDER BY 1;
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT id1,id2 FROM bar GROUP BY id1,id2) AS s) ORDER BY 1;
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT id1, id2 FROM bar UNION
	SELECT id1, id2 FROM bar) AS s) ORDER BY 1;

	-- These cases do not
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT DISTINCT ON (id2) id1, id2 FROM bar) AS s) ORDER BY 1;
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT id2 FROM bar GROUP BY id2) AS s) ORDER BY 1;
	SELECT * FROM foo WHERE id IN
	(SELECT id2 FROM (SELECT id2 FROM bar UNION
	SELECT id2 FROM bar) AS s) ORDER BY 1;

	--
	-- Test case to catch problems with multiply nested sub-SELECTs not getting
	-- recalculated properly. Per bug report from Didier Moens.
	--

	CREATE TABLE orderstest (
	approver_ref integer,
	po_ref integer,
	ordercancelled boolean
	);

	INSERT INTO orderstest VALUES (1, 1, false);
	INSERT INTO orderstest VALUES (66, 5, false);
	INSERT INTO orderstest VALUES (66, 6, false);
	INSERT INTO orderstest VALUES (66, 7, false);
	INSERT INTO orderstest VALUES (66, 1, true);
	INSERT INTO orderstest VALUES (66, 8, false);
	INSERT INTO orderstest VALUES (66, 1, false);
	INSERT INTO orderstest VALUES (77, 1, false);
	INSERT INTO orderstest VALUES (1, 1, false);
	INSERT INTO orderstest VALUES (66, 1, false);
	INSERT INTO orderstest VALUES (1, 1, false);

	CREATE VIEW orders_view AS
	SELECT *,
	(SELECT CASE
	WHEN ord.approver_ref=1 THEN '---' ELSE 'Approved'
	END) AS "Approved",
	(SELECT CASE
	WHEN ord.ordercancelled
	THEN 'Cancelled'
	ELSE
	(SELECT CASE
	WHEN ord.po_ref=1
	THEN
	(SELECT CASE
	WHEN ord.approver_ref=1
	THEN '---'
	ELSE 'Approved'
	END)
	ELSE 'PO'
	END)
	END) AS "Status",
	(CASE
	WHEN ord.ordercancelled
	THEN 'Cancelled'
	ELSE
	(CASE
	WHEN ord.po_ref=1
	THEN
	(CASE
	WHEN ord.approver_ref=1
	THEN '---'
	ELSE 'Approved'
	END)
	ELSE 'PO'
	END)
	END) AS "Status_OK"
	FROM orderstest ord;

	SELECT * FROM orders_view ORDER BY 1,2;

	DROP TABLE orderstest cascade;

	--
	-- Test cases to catch situations where rule rewriter fails to propagate
	-- hasSubLinks flag correctly. Per example from Kyle Bateman.
	--

	create temp table parts (
	partnum text,
	cost float8
	);

	create temp table shipped (
	ttype char(2),
	ordnum int4,
	partnum text,
	value float8
	);

	create temp view shipped_view as
	select * from shipped where ttype = 'wt';

	create rule shipped_view_insert as on insert to shipped_view do instead
	insert into shipped values('wt', new.ordnum, new.partnum, new.value);

	insert into parts (partnum, cost) values (1, 1234.56);

	insert into shipped_view (ordnum, partnum, value)
	values (0, 1, (select cost from parts where partnum = 1));

	select * from shipped_view ORDER BY 1,2;

	create rule shipped_view_update as on update to shipped_view do instead
	update shipped set partnum = new.partnum, value = new.value
	where ttype = new.ttype and ordnum = new.ordnum;

	select * from shipped_view ORDER BY 1,2;

	select f1, ss1 as relabel from
	(select *, (select sum(f1) from int4_tbl b where f1 >= a.f1) as ss1
	from int4_tbl a) ss;

	--
	-- Test cases involving PARAM_EXEC parameters and min/max index optimizations.
	-- Per bug report from David Sanchez i Gregori.
	--

	select * from (
	select max(unique1) from tenk1 as a
	where exists (select 1 from tenk1 as b where b.thousand = a.unique2)
	) ss;

	select * from (
	select min(unique1) from tenk1 as a
	where not exists (select 1 from tenk1 as b where b.unique2 = 10000)
	) ss;

	--
	-- Base tables for CSQ tests
	--

	drop table if exists csq_t1_base;
	create table csq_t1_base(x int, y int) distributed by (x);

	insert into csq_t1_base values(1,2);
	insert into csq_t1_base values(2,1);
	insert into csq_t1_base values(4,2);

	drop table if exists csq_t2_base;
	create table csq_t2_base(x int, y int) distributed by (x);

	insert into csq_t2_base values(3,2);
	insert into csq_t2_base values(3,2);
	insert into csq_t2_base values(3,2);
	insert into csq_t2_base values(3,2);
	insert into csq_t2_base values(3,1);


	--
	-- Correlated subqueries
	--

	drop table if exists csq_t1;
	drop table if exists csq_t2;

	create table csq_t1(x int, y int) distributed by (x);
	create table csq_t2(x int, y int) distributed by (x);

	insert into csq_t1 select * from csq_t1_base;
	insert into csq_t2 select * from csq_t2_base;

	select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1; -- expected (4,2)

	--
	-- correlations in the targetlist
	--

	select csq_t1.x, (select sum(bar.x) from csq_t1 bar where bar.x >= csq_t1.x) as sum from csq_t1 order by csq_t1.x;

	select csq_t1.x, (select sum(bar.x) from csq_t1 bar where bar.x = csq_t1.x) as sum from csq_t1 order by csq_t1.x;

	select csq_t1.x, (select bar.x from csq_t1 bar where bar.x = csq_t1.x) as sum from csq_t1 order by csq_t1.x;

	--
	-- CSQs with partitioned tables
	--

	drop table if exists csq_t1;
	drop table if exists csq_t2;

	create table csq_t1(x int, y int)
	distributed by (x)
	partition by range (y) ( start (0) end (4) every (1))
	;

	create table csq_t2(x int, y int)
	distributed by (x)
	partition by range (y) ( start (0) end (4) every (1))
	;

	insert into csq_t1 select * from csq_t1_base;
	insert into csq_t2 select * from csq_t2_base;

	explain select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1;

	select * from csq_t1 where csq_t1.x >ALL (select csq_t2.x from csq_t2 where csq_t2.y=csq_t1.y) order by 1; -- expected (4,2)

	drop table if exists csq_t1;
	drop table if exists csq_t2;
	drop table if exists csq_t1_base;
	drop table if exists csq_t2_base;

	--
	-- Multi-row subqueries
	--

	drop table if exists mrs_t1;
	create table mrs_t1(x int) distributed by (x);

	insert into mrs_t1 select generate_series(1,20);

	explain select * from mrs_t1 where exists (select x from mrs_t1 where x < -1);
	select * from mrs_t1 where exists (select x from mrs_t1 where x < -1) order by 1;

	explain select * from mrs_t1 where exists (select x from mrs_t1 where x = 1);
	select * from mrs_t1 where exists (select x from mrs_t1 where x = 1) order by 1;

	explain select * from mrs_t1 where x in (select x-95 from mrs_t1) or x < 5;
	select * from mrs_t1 where x in (select x-95 from mrs_t1) or x < 5 order by 1;

	explain select 1 as mrs_t1 where 1 <= ALL (Select x from mrs_t1);
	select 1 as mrs_t1 where 1 <= ALL (Select x from mrs_t1) order by 1;

	drop table if exists mrs_t1;

	--
	-- Multi-row subquery from MSTR
	--
	drop table if exists mrs_u1;
	drop table if exists mrs_u2;

	create TABLE mrs_u1 (a int, b int);
	create TABLE mrs_u2 (a int, b int);

	insert into mrs_u1 values (1,2),(11,22);
	insert into mrs_u2 values (1,2),(11,22),(33,44);

	select * from mrs_u1 join mrs_u2 on mrs_u1.a=mrs_u2.a where mrs_u1.a in (1,11) or mrs_u2.a in (select a from mrs_u1 where a=1) order by 1;

	drop table if exists mrs_u1;
	drop table if exists mrs_u2;

	--
	-- MPP-13758
	--

	drop table if exists csq_m1;
	create table csq_m1(y int);
	alter table csq_m1 add column x int default 0;
	insert into csq_m1 values(1,1);

	drop table if exists csq_d1;
	create table csq_d1(y int, x int) distributed by (x);
	insert into csq_d1 select * from csq_m1;

	explain select array(select x from csq_m1); -- no initplan
	select array(select x from csq_m1); -- {1}

	explain select array(select x from csq_d1); -- initplan
	select array(select x from csq_d1); -- {1}

	--
	-- CSQs involving master-only and distributed tables
	--

	drop table if exists t3coquicklz;

	create table t3coquicklz (c1 int , c2 varchar) with (appendonly=true, compresstype=quicklz, orientation=column) distributed by (c1);

	drop table if exists pg_attribute_storage;

	create table pg_attribute_storage (attrelid int, attnum int, attoptions text[]) distributed by (attrelid);

	insert into pg_attribute_storage values ('t3coquicklz'::regclass, 1, E'{\'something\'}');
	insert into pg_attribute_storage values ('t3coquicklz'::regclass, 2, E'{\'something2\'}');

	SELECT a.attname
	, pg_catalog.format_type(a.atttypid, a.atttypmod)

	, ( SELECT substring(pg_catalog.pg_get_expr(d.adbin, d.adrelid) for 128)
	FROM pg_catalog.pg_attrdef d
	WHERE d.adrelid = a.attrelid AND d.adnum = a.attnum AND a.atthasdef
	)
	, a.attnotnull
	, a.attnum
	, a.attstorage
	, pg_catalog.col_description(a.attrelid, a.attnum)
	, ( SELECT s.attoptions
	FROM pg_attribute_storage s
	WHERE s.attrelid = a.attrelid AND s.attnum = a.attnum
	) newcolumn

	FROM pg_catalog.pg_attribute a
	WHERE a.attrelid = 't3coquicklz'::regclass AND a.attnum > 0 AND NOT a.attisdropped
	ORDER BY a.attnum
	; -- expect to see 2 rows

	--
	-- More CSQs involving master-only and distributed relations
	--

	drop table if exists csq_m1;
	create table csq_m1(y int);
	alter table csq_m1 add column x int default 0;
	insert into csq_m1 values(1,1),(1,2),(1,3);

	drop table if exists csq_d1;
	create table csq_d1(y int, x int) distributed by (x);
	insert into csq_d1 select * from csq_m1 where x < 3;
	insert into csq_d1 values(1, 4);

	select * from csq_m1;
	select * from csq_d1;

	--
	-- outer plan node is master-only and CSQ has distributed relation
	--

	explain select * from csq_m1 where x not in (select x from csq_d1) or x < -100; -- gather motion
	select * from csq_m1 where x not in (select x from csq_d1) or x < -100; -- (3)

	--
	-- outer plan node is master-only and CSQ has distributed relation
	--

	explain select * from csq_d1 where x not in (select x from csq_m1) or x < -100; -- broadcast motion
	select * from csq_d1 where x not in (select x from csq_m1) or x < -100; -- (4)

	--
	-- MPP-14441 Don't lose track of initplans
	--
	drop table if exists csq_t1;
	CREATE TABLE csq_t1 (a int, b int, c int, d int, e text) DISTRIBUTED BY (a);
	INSERT INTO csq_t1 SELECT i, i/3, i%2, 100-i, 'text'\|\|i FROM generate_series(1,100) i;

	select count(*) from csq_t1 t1 where a > (SELECT x.b FROM ( select avg(a)::int as b,'haha'::text from csq_t1 t2 where t2.a=t1.d) x ) ;

	select count(*) from csq_t1 t1 where a > ( select avg(a)::int from csq_t1 t2 where t2.a=t1.d) ;

	--
	-- correlation in a func expr
	--
	CREATE FUNCTION csq_f(a int) RETURNS int AS $$ select $1 $$ LANGUAGE SQL;
	CREATE TABLE csq_r(a int);
	INSERT INTO csq_r VALUES (1);

	-- subqueries shouldn't be pulled into a join if the from clause has a function call
	-- with a correlated argument

	-- force_explain
	explain SELECT * FROM csq_r WHERE a IN (SELECT * FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE a IN (SELECT * FROM csq_f(csq_r.a));

	-- force_explain
	explain SELECT * FROM csq_r WHERE a not IN (SELECT * FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE a not IN (SELECT * FROM csq_f(csq_r.a));

	-- force_explain
	explain SELECT * FROM csq_r WHERE exists (SELECT * FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE exists (SELECT * FROM csq_f(csq_r.a));

	-- force_explain
	explain SELECT * FROM csq_r WHERE not exists (SELECT * FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE not exists (SELECT * FROM csq_f(csq_r.a));

	-- force_explain
	explain SELECT * FROM csq_r WHERE a > (SELECT csq_f FROM csq_f(csq_r.a) limit 1);

	SELECT * FROM csq_r WHERE a > (SELECT csq_f FROM csq_f(csq_r.a) limit 1);

	-- force_explain
	explain SELECT * FROM csq_r WHERE a < ANY (SELECT csq_f FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE a < ANY (SELECT csq_f FROM csq_f(csq_r.a));

	-- force_explain
	explain SELECT * FROM csq_r WHERE a <= ALL (SELECT csq_f FROM csq_f(csq_r.a));

	SELECT * FROM csq_r WHERE a <= ALL (SELECT csq_f FROM csq_f(csq_r.a));

	-- fails: correlation in distributed subplan
	-- force_explain
	explain SELECT * FROM csq_r WHERE a IN (SELECT csq_f FROM csq_f(csq_r.a),csq_r);

	--
	-- Test pullup of expr CSQs to joins
	--

	--
	-- Test data
	--

	drop table if exists csq_pullup;
	create table csq_pullup(t text, n numeric, i int, v varchar(10));
	insert into csq_pullup values ('abc',1, 2, 'xyz');
	insert into csq_pullup values ('xyz',2, 3, 'def');
	insert into csq_pullup values ('def',3, 1, 'abc');

	--
	-- Expr CSQs to joins
	--

	--
	-- text, text
	--

	explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.t);

	select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.t);

	--
	-- text, varchar
	--

	explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.v);

	select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.t=t1.v);

	--
	-- numeric, numeric
	--

	explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n=t1.n);

	select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n=t1.n);

	--
	-- function(numeric), function(numeric)
	--

	explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.n + 1);

	select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.n + 1);


	--
	-- function(numeric), function(int)
	--

	explain select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.i + 1);

	select * from csq_pullup t0 where 1= (select count(*) from csq_pullup t1 where t0.n + 1=t1.i + 1);


	--
	-- NOT EXISTS CSQs to joins
	--

	--
	-- text, text
	--

	explain select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.t=t1.t and t1.i = 1);

	select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.t=t1.t and t1.i = 1);

	--
	-- int, function(int)
	--

	explain select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.i=t1.i + 1);

	select * from csq_pullup t0 where not exists (select 1 from csq_pullup t1 where t0.i=t1.i + 1);