| --start_ignore |
| drop table if exists testbadsql; |
| NOTICE: table "testbadsql" does not exist, skipping |
| drop table if exists bfv_planner_x; |
| NOTICE: table "bfv_planner_x" does not exist, skipping |
| drop table if exists bfv_planner_foo; |
| NOTICE: table "bfv_planner_foo" does not exist, skipping |
| --end_ignore |
| CREATE TABLE testbadsql(id int); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table. |
| HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. |
| CREATE TABLE bfv_planner_x(i integer); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'i' as the Apache Cloudberry data distribution key for this table. |
| HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. |
| CREATE TABLE bfv_planner_foo AS SELECT i as a, i+1 as b from generate_series(1,10)i; |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause. Creating a NULL policy entry. |
| -- |
| -- Test for an unexpected internal error (execQual.c:4413) when using subquery + window function + UNION in 4.2.6.x |
| -- |
| -- Q1 |
| select * from |
| (SELECT MIN(id) OVER () minid FROM testbadsql |
| UNION |
| SELECT MIN(id) OVER () minid FROM testbadsql |
| ) tmp |
| where tmp.minid=123; |
| minid |
| ------- |
| (0 rows) |
| |
| -- Q2 |
| select * from |
| (SELECT MIN(id) OVER () minid FROM testbadsql |
| UNION |
| SELECT 1 |
| ) tmp |
| where tmp.minid=123; |
| minid |
| ------- |
| (0 rows) |
| |
| -- Q3 |
| select * from |
| (SELECT MIN(id) OVER () minid FROM testbadsql) tmp |
| where tmp.minid=123; |
| minid |
| ------- |
| (0 rows) |
| |
| -- Q4 |
| SELECT * from ( |
| SELECT max(i) over () as w from bfv_planner_x Union Select 1 as w) |
| as bfv_planner_foo where w > 0; |
| w |
| --- |
| 1 |
| (1 row) |
| |
| -- |
| -- Test queries using the median function together with count(*) |
| -- |
| --start_ignore |
| drop table if exists testmedian; |
| NOTICE: table "testmedian" does not exist, skipping |
| --end_ignore |
| CREATE TABLE testmedian |
| ( |
| a character(2) NOT NULL, |
| b character varying(8) NOT NULL, |
| c character varying(8) NOT NULL, |
| value1 double precision, |
| value2 double precision |
| ) |
| WITH ( |
| OIDS=FALSE |
| ) |
| DISTRIBUTED BY (b,c); |
| insert into testmedian |
| select i, i, i, i, i |
| from (select * from generate_series(1, 99) i ) a ; |
| -- Test with count() |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by b, c, value2; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with varying ORDER-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='25' |
| group by a, b, c, value2 |
| order by c,b; |
| median | count |
| --------+------- |
| 25 | 1 |
| (1 row) |
| |
| -- Test with varying ORDER-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by b,c,value1 |
| order by b, c, value1; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with sum() |
| select median(value1), sum(value2) |
| from testmedian |
| where c ='55' |
| group by b, c, value2; |
| median | sum |
| --------+----- |
| 55 | 55 |
| (1 row) |
| |
| -- Test with min() |
| select median(value1), min(c) |
| from testmedian |
| where c ='55' |
| group by b, c, value2; |
| median | min |
| --------+----- |
| 55 | 55 |
| (1 row) |
| |
| -- Test with varying GROUP-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by b; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with varying GROUP-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by b,c; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with varying GROUP-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by c,b; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with varying GROUP-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='55' |
| group by b,c,value1; |
| median | count |
| --------+------- |
| 55 | 1 |
| (1 row) |
| |
| -- Test with varying ORDER-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='25' |
| group by b, value1 |
| order by b; |
| median | count |
| --------+------- |
| 25 | 1 |
| (1 row) |
| |
| -- Test with varying ORDER-BY clause |
| select median(value1), count(*) |
| from testmedian |
| where c ='25' |
| group by b, c, value2 |
| order by b,c; |
| median | count |
| --------+------- |
| 25 | 1 |
| (1 row) |
| |
| -- Test inheritance planning, where a SubPlan is duplicated for different |
| -- child tables. |
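| -- (The planner builds a separate plan for each child table, so the SubPlan |
| -- for the IN clause is duplicated. Note that p and p2 are distributed |
| -- differently, by a and by b respectively, so each copy of the SubPlan may |
| -- need different Motion nodes.) |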
| create table r (a int) distributed by (a); |
| create table p (a int, b int) distributed by (a); |
| create table p2 (a int, b int) inherits (p) distributed by (b); |
| NOTICE: merging column "a" with inherited definition |
| NOTICE: merging column "b" with inherited definition |
| insert into r values (3); |
| insert into p select a, b from generate_series(1,3) a, generate_series(1,3) b; |
| delete from p where b = 1 or (b=2 and a in (select r.a from r)); |
| select * from p; |
| a | b |
| ---+--- |
| 3 | 3 |
| 1 | 2 |
| 1 | 3 |
| 2 | 2 |
| 2 | 3 |
| (5 rows) |
| |
| delete from p where b = 1 or (b=2 and a in (select b from r)); |
| select * from p; |
| a | b |
| ---+--- |
| 1 | 2 |
| 1 | 3 |
| 2 | 3 |
| 3 | 3 |
| (4 rows) |
| |
| -- Test planning of IS NOT FALSE. We used to treat "(a = b) IS NOT FALSE" as |
| -- hash joinable, and created a plan with a hash join on "(a = b)". That |
| -- was wrong, because NULLs are treated differently. |
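| -- A quick worked example (illustrative only): with a NULL on either side, |
| -- "a = b" evaluates to NULL, and "NULL IS NOT FALSE" is true, so rows with |
| -- NULLs must be kept; a hash join on "(a = b)" would have discarded them. |
| -- That is exactly what the 4-row result below demonstrates. |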
| create table booltest (b bool); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'b' as the Apache Cloudberry data distribution key for this table. |
| HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. |
| insert into booltest values ('t'); |
| insert into booltest values (null); |
| select * from booltest a, booltest b where (a.b = b.b) is not false; |
| b | b |
| ---+--- |
| | |
| | t |
| t | |
| t | t |
| (4 rows) |
| |
| -- Lossy index qual, used as a partial index predicate, with the same column |
| -- used in FOR SHARE. (A GiST index on a tsvector is lossy, so index matches |
| -- must be rechecked against the heap tuple.) This combination once tickled |
| -- a bug in the planner. |
| create table tstest (t tsvector); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause, and no column type is suitable for a distribution key. Creating a NULL policy entry. |
| create index i_tstest on tstest using gist (t) WHERE t @@ 'bar'; |
| insert into tstest values ('foo'); |
| insert into tstest values ('bar'); |
| set enable_bitmapscan =off; |
| set enable_seqscan =off; |
| select * from tstest where t @@ 'bar' for share of tstest; |
| t |
| ------- |
| 'bar' |
| (1 row) |
| |
| -- Stable (and volatile) functions need to be re-evaluated on every |
| -- execution of a prepared statement. There used to be a bug, where |
| -- they were evaluated once at planning time or at first execution, |
| -- and the same value was incorrectly reused on subsequent executions. |
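| -- For example (a sketch, not executed as part of this test; the table and |
| -- column are hypothetical): now() is stable, so a prepared statement like |
| --   prepare p as select * from some_tab where ts < now(); |
| -- must see a fresh now() on every EXECUTE; reusing the value captured at |
| -- the first execution could return stale rows. |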
| create function stabletestfunc() returns integer as $$ |
| begin |
| raise notice 'stabletestfunc executed'; |
| return 123; |
| end; |
| $$ language plpgsql stable; |
| create table stabletesttab (id integer); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table. |
| HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. |
| insert into stabletesttab values (1); |
| insert into stabletesttab values (1000); |
| -- This might evaluate the function for cost-estimation purposes. That's |
| -- not important for this test. |
| prepare myprep as select * from stabletesttab where id < stabletestfunc(); |
| -- Check that the stable function is re-executed on every execution of the prepared statement. |
| execute myprep; |
| NOTICE: stabletestfunc executed |
| id |
| ---- |
| 1 |
| (1 row) |
| |
| execute myprep; |
| NOTICE: stabletestfunc executed |
| id |
| ---- |
| 1 |
| (1 row) |
| |
| execute myprep; |
| NOTICE: stabletestfunc executed |
| id |
| ---- |
| 1 |
| (1 row) |
| |
| -- Test that pl/pgsql simple expressions are not considered a |
| -- oneoffPlan. We validate this by ensuring that a simple expression |
| -- involving a stable function is planned only once and the same plan |
| -- is re-executed for each tuple. The NOTICE in the immutable |
| -- function allows us to detect when it is executed. We assume that |
| -- the planner folds immutablefunc() into a const. |
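| -- (Roughly, a oneoffPlan is a plan in which stable-function results were |
| -- folded into constants at planning time, so it must be re-planned on the |
| -- next execution. Classifying every pl/pgsql simple expression that way |
| -- would force re-planning, and hence re-evaluation of immutablefunc(), |
| -- once per tuple.) |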
| CREATE FUNCTION immutablefunc() RETURNS int2 |
| LANGUAGE plpgsql IMMUTABLE STRICT AS |
| $$ |
| BEGIN |
| raise notice 'immutablefunc executed'; |
| return 42; |
| END |
| $$; |
| CREATE FUNCTION stablenow (dummy int2) RETURNS timestamp |
| LANGUAGE plpgsql STABLE STRICT AS |
| $fn$ |
| BEGIN |
| return now(); |
| END |
| $fn$; |
| CREATE FUNCTION volatilefunc(a int) RETURNS int |
| LANGUAGE plpgsql VOLATILE STRICT AS |
| $fn$ |
| DECLARE |
| t timestamp; |
| BEGIN |
| t := stablenow(immutablefunc()); |
| if date_part('month', t) > a then |
| return 0; |
| else |
| return 1; |
| end if; |
| END |
| $fn$; |
| CREATE TABLE oneoffplantest (a int) distributed by (a); |
| INSERT INTO oneoffplantest VALUES (0), (0), (0); |
| -- The plan for the following query should be cached such that the call to |
| -- immutablefunc() is folded into a const. Note that all the |
| -- statements within volatilefunc() are pl/pgsql simple expressions. |
| -- Their plans should NOT be classified as oneoffPlan and should be |
| -- cached, so we expect the NOTICE to be printed only once, |
| -- regardless of the number of tuples in the table. |
| select volatilefunc(a) from oneoffplantest; |
| NOTICE: immutablefunc executed (seg0 slice1 127.0.1.1:25432 pid=6257) |
| volatilefunc |
| -------------- |
| 0 |
| 0 |
| 0 |
| (3 rows) |
| |
| -- Test an aggregate on top of a join of subqueries on a partitioned table with an ORDER BY clause |
| CREATE TABLE bfv_planner_t1 (a int, b int, c int) distributed by (c); |
| CREATE TABLE bfv_planner_t2 (f int,g int) DISTRIBUTED BY (f) PARTITION BY RANGE(g) |
| ( |
| PARTITION "201612" START (1) END (10) |
| ); |
| NOTICE: CREATE TABLE will create partition "bfv_planner_t2_1_prt_201612" for table "bfv_planner_t2" |
| insert into bfv_planner_t1 values(1,2,3), (2,3,4), (3,4,5); |
| insert into bfv_planner_t2 values(3,1), (4,2), (5,2); |
| select count(*) from |
| (select a,b,c from bfv_planner_t1 order by c) T1 |
| join |
| (select f,g from bfv_planner_t2) T2 |
| on |
| T1.a=T2.g and T1.c=T2.f; |
| count |
| ------- |
| 2 |
| (1 row) |
| |
| -- This produced a "could not find pathkey item to sort" error at one point. |
| -- The problem was that we stripped out column b from the SubqueryScan's |
| -- target list, as it's not needed in the final result, but we tried to |
| -- maintain the ordering (a,b) in the Gather Motion node, which would have |
| -- required column b to be present, at least as a junk column. |
| create table bfv_planner_t3 (a int4, b int4); |
| NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table. |
| HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. |
| select a from (select * from bfv_planner_t3 order by a, b) as x limit 1; |
| a |
| --- |
| (0 rows) |
| |
| -- Similar case, but when evaluating a window function rather than LIMIT |
| select first_value(a) over w, a |
| from (select * from bfv_planner_t3 order by a, b) as x |
| WINDOW w AS (order by a); |
| first_value | a |
| -------------+--- |
| (0 rows) |
| |
| -- volatile general |
| -- General and segmentGeneral locus imply that the corresponding |
| -- slice, if executed on many different segments, provides the |
| -- same result data set. Thus, in some cases, General and segmentGeneral |
| -- can be treated like broadcast. But if a segmentGeneral or general |
| -- locus path contains volatile functions, it loses that property and |
| -- can only be treated as singleQE. The following cases check that |
| -- we handle all of these cases correctly. |
| -- FIXME: ORCA does not take this into account for the following SQL. |
| -- Fix these cases when ORCA changes. |
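| -- A minimal illustration (not executed here): a path such as |
| --   select random() from generate_series(1, 10) |
| -- has General locus, but if it were broadcast, random() would be evaluated |
| -- independently on every segment and each copy would produce different |
| -- rows; confining it to a single QE keeps the result set consistent. |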
| create table t_hashdist(a int, b int, c int) distributed by (a); |
| ---- pushed down filter |
| explain (costs off) |
| select * from |
| (select a from generate_series(1, 10)a) x, t_hashdist |
| where x.a > random(); |
| QUERY PLAN |
| ---------------------------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Seq Scan on t_hashdist |
| -> Materialize |
| -> Result |
| Filter: ((generate_series.generate_series)::double precision > random()) |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (9 rows) |
| |
| ---- join qual |
| explain (costs off) select * from |
| t_hashdist, |
| (select a from generate_series(1, 1000) a) x, |
| (select a from generate_series(1, 1000) a) y |
| where x.a + y.a > random(); |
| QUERY PLAN |
| ----------------------------------------------------------------------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Seq Scan on t_hashdist |
| -> Nested Loop |
| Join Filter: (((generate_series_1.generate_series + generate_series.generate_series))::double precision > random()) |
| -> Function Scan on generate_series generate_series_1 |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (9 rows) |
| |
| ---- sublink & subquery |
| explain (costs off) select * from t_hashdist where a > All (select random() from generate_series(1, 10)); |
| QUERY PLAN |
| ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
| Result |
| Filter: (SubPlan 1) |
| -> Gather Motion 3:1 (slice1; segments: 3) |
| -> Seq Scan on t_hashdist |
| SubPlan 1 |
| -> Result |
| Filter: ((CASE WHEN (sum((CASE WHEN ((t_hashdist.a)::double precision <= random()) THEN 1 ELSE 0 END)) IS NULL) THEN true WHEN (sum((CASE WHEN (random() IS NULL) THEN 1 ELSE 0 END)) > '0'::bigint) THEN NULL::boolean WHEN ((t_hashdist.a)::double precision IS NULL) THEN NULL::boolean WHEN (sum((CASE WHEN ((t_hashdist.a)::double precision <= random()) THEN 1 ELSE 0 END)) = '0'::bigint) THEN true ELSE false END) = true) |
| -> Aggregate |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (10 rows) |
| |
| explain (costs off) select * from t_hashdist where a in (select random()::int from generate_series(1, 10)); |
| QUERY PLAN |
| ---------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Hash Semi Join |
| Hash Cond: (t_hashdist.a = ((random())::integer)) |
| -> Seq Scan on t_hashdist |
| -> Hash |
| -> Redistribute Motion 1:3 (slice2) |
| Hash Key: ((random())::integer) |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (9 rows) |
| |
| -- subplan |
| explain (costs off, verbose) select * from |
| t_hashdist left join (select a from generate_series(1, 10) a) x on t_hashdist.a > any (select random() from generate_series(1, 10)); |
| QUERY PLAN |
| ----------------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| Output: t_hashdist.a, t_hashdist.b, t_hashdist.c, a.a |
| -> Nested Loop Left Join |
| Output: t_hashdist.a, t_hashdist.b, t_hashdist.c, a.a |
| Join Filter: ((SubPlan 1)) |
| -> Seq Scan on public.t_hashdist |
| Output: t_hashdist.a, t_hashdist.b, t_hashdist.c, (SubPlan 1) |
| SubPlan 1 |
| -> Materialize |
| Output: (random()) |
| -> Broadcast Motion 1:3 (slice2) |
| Output: (random()) |
| -> Function Scan on pg_catalog.generate_series |
| Output: random() |
| Function Call: generate_series(1, 10) |
| -> Function Scan on pg_catalog.generate_series a |
| Output: a.a |
| Function Call: generate_series(1, 10) |
| Optimizer: Postgres query optimizer |
| Settings: enable_bitmapscan=off, enable_seqscan=off, optimizer=on |
| (20 rows) |
| |
| -- targetlist |
| explain (costs off) select * from t_hashdist cross join (select random () from generate_series(1, 10))x; |
| QUERY PLAN |
| ------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Broadcast Motion 3:3 (slice2; segments: 3) |
| -> Seq Scan on t_hashdist |
| -> Materialize |
| -> Result |
| One-Time Filter: (gp_execution_segment() = 2) |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (10 rows) |
| |
| explain (costs off) select * from t_hashdist cross join (select a, sum(random()) from generate_series(1, 10) a group by a) x; |
| QUERY PLAN |
| ---------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Broadcast Motion 3:3 (slice3; segments: 3) |
| -> Seq Scan on t_hashdist |
| -> Materialize |
| -> Redistribute Motion 1:3 (slice2) |
| -> HashAggregate |
| Group Key: generate_series.generate_series |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (11 rows) |
| |
| explain (costs off) select * from t_hashdist cross join (select random() as k, sum(a) from generate_series(1, 10) a group by k) x; |
| QUERY PLAN |
| --------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> HashAggregate |
| Group Key: (random()) |
| -> Redistribute Motion 1:3 (slice3) |
| Hash Key: (random()) |
| -> Function Scan on generate_series |
| -> Materialize |
| -> Broadcast Motion 3:3 (slice2; segments: 3) |
| -> Seq Scan on t_hashdist |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (12 rows) |
| |
| explain (costs off) select * from t_hashdist cross join (select a, count(1) as s from generate_series(1, 10) a group by a having count(1) > random() order by a) x ; |
| QUERY PLAN |
| ------------------------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Result |
| Filter: (((count(1)))::double precision > random()) |
| -> HashAggregate |
| Group Key: generate_series.generate_series |
| -> Function Scan on generate_series |
| -> Seq Scan on t_hashdist |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (10 rows) |
| |
| -- limit |
| explain (costs off) select * from t_hashdist cross join (select * from generate_series(1, 10) limit random()) x; |
| QUERY PLAN |
| ---------------------------------------------------- |
| Gather Motion 3:1 (slice1; segments: 3) |
| -> Nested Loop |
| Join Filter: true |
| -> Seq Scan on t_hashdist |
| -> Limit |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (7 rows) |
| |
| -- CTAS on general locus into replicated table |
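| -- nextval() is volatile, so for a replicated target it must be evaluated |
| -- once on a single QE and the result rows broadcast to every segment (note |
| -- the Broadcast Motion 1:3 in the plan below); otherwise each replica |
| -- would end up with different sequence values. |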
| create temp SEQUENCE test_seq; |
| explain (costs off) create table t_rep as select nextval('test_seq') from (select generate_series(1, 10)) t1 distributed replicated; |
| QUERY PLAN |
| --------------------------------------- |
| Result |
| -> Broadcast Motion 1:3 (slice1) |
| -> Result |
| -> ProjectSet |
| -> Result |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (6 rows) |
| |
| create table t_rep1 as select nextval('test_seq') from (select generate_series(1, 10)) t1 distributed replicated; |
| select count(*) from gp_dist_random('t_rep1'); |
| count |
| ------- |
| 30 |
| (1 row) |
| |
| select count(distinct nextval) from gp_dist_random('t_rep1'); |
| count |
| ------- |
| 10 |
| (1 row) |
| |
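| -- The counts above confirm the replicated property: 3 segments x 10 rows |
| -- give 30 rows in total but only 10 distinct values, i.e. every segment |
| -- holds an identical copy of the same 10 rows. |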
| drop table t_rep1; |
| -- CTAS on general locus into replicated table with HAVING |
| explain (costs off) create table t_rep as select i from generate_series(5, 15) as i group by i having i < nextval('test_seq') distributed replicated; |
| QUERY PLAN |
| ------------------------------------------------------------------------- |
| Result |
| -> Broadcast Motion 3:3 (slice1; segments: 3) |
| -> Result |
| Filter: (generate_series < nextval('test_seq'::regclass)) |
| -> HashAggregate |
| Group Key: generate_series |
| -> Result |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (9 rows) |
| |
| create table t_rep2 as select i from generate_series(5, 15) as i group by i having i < nextval('test_seq') distributed replicated; |
| select count(*) from gp_dist_random('t_rep2'); |
| count |
| ------- |
| 33 |
| (1 row) |
| |
| select count(distinct i) from gp_dist_random('t_rep2'); |
| count |
| ------- |
| 11 |
| (1 row) |
| |
| drop table t_rep2; |
| -- CTAS on general locus into replicated table with GROUP BY |
| explain (costs off) create table t_rep as select i > nextval('test_seq') from generate_series(5, 15) as i group by i > nextval('test_seq') distributed replicated; |
| QUERY PLAN |
| ----------------------------------------------------------------------------------------- |
| Result |
| -> Broadcast Motion 3:3 (slice1; segments: 3) |
| -> GroupAggregate |
| Group Key: ((generate_series > nextval('test_seq'::regclass))) |
| -> Sort |
| Sort Key: ((generate_series > nextval('test_seq'::regclass))) |
| -> Redistribute Motion 1:3 (slice2) |
| Hash Key: ((generate_series > nextval('test_seq'::regclass))) |
| -> Function Scan on generate_series |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (10 rows) |
| |
| create table t_rep3 as select i > nextval('test_seq') as a from generate_series(5, 15) as i group by i > nextval('test_seq') distributed replicated; |
| select count(*) from gp_dist_random('t_rep3'); |
| count |
| ------- |
| 3 |
| (1 row) |
| |
| select count(distinct a) from gp_dist_random('t_rep3'); |
| count |
| ------- |
| 1 |
| (1 row) |
| |
| drop table t_rep3; |
| -- CTAS on replicated table into replicated table |
| create table rep_tbl as select t1 from generate_series(1, 10) t1 distributed replicated; |
| explain (costs off) create table t_rep as select nextval('test_seq') from rep_tbl distributed replicated; |
| QUERY PLAN |
| --------------------------------------------------- |
| Result |
| -> Broadcast Motion 1:3 (slice1; segments: 1) |
| -> Seq Scan on rep_tbl |
| Optimizer: Pivotal Optimizer (GPORCA) |
| (4 rows) |
| |
| create table t_rep4 as select nextval('test_seq') from rep_tbl distributed replicated; |
| select count(*) from gp_dist_random('t_rep4'); |
| count |
| ------- |
| 30 |
| (1 row) |
| |
| select count(distinct nextval) from gp_dist_random('t_rep4'); |
| count |
| ------- |
| 10 |
| (1 row) |
| |
| drop table rep_tbl, t_rep4; |
| -- |
| -- Test that appending tables with different numsegments works well |
| -- See Github issue: https://github.com/greenplum-db/gpdb/issues/12146 |
| -- |
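| -- (numsegments in gp_distribution_policy records how many segments a |
| -- table's data spans; a table can legitimately be partially distributed, |
| -- e.g. while a cluster expansion is in progress. The updates below use |
| -- allow_system_table_mods to simulate that state directly.) |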
| create table t1_12146 (a int, b int) distributed by (a); |
| create table t2_12146 (a int, b int) distributed by (a); |
| create table t3_12146 (a int, b int) distributed by (a); |
| create table t4_12146 (a int, b int) distributed by (a); |
| -- make t1_12146 and t2_12146 partially distributed |
| set allow_system_table_mods = on; |
| update gp_distribution_policy set numsegments = 2 |
| where localoid in ('t1_12146'::regclass::oid, 't2_12146'::regclass::oid); |
| insert into t1_12146 select i,i from generate_series(1, 10000)i; |
| insert into t2_12146 select i,i from generate_series(1, 10000)i; |
| insert into t3_12146 select i,i from generate_series(1, 10)i; |
| insert into t4_12146 select i,i from generate_series(1, 10)i; |
| -- now make t1_12146 and t2_12146 randomly distributed |
| update gp_distribution_policy |
| set distkey = '', distclass = '' |
| where localoid in ('t1_12146'::regclass::oid, 't2_12146'::regclass::oid); |
| analyze t1_12146; |
| analyze t2_12146; |
| analyze t3_12146; |
| analyze t4_12146; |
| explain select count(*) |
| from |
| ( |
| ( |
| -- t1 left join t3 builds a plan that broadcasts t3, |
| -- so that the join's locus is t1's locus: |
| -- strewn on 2 segs |
| select |
| * |
| from t1_12146 left join t3_12146 on t1_12146.b = t3_12146.b |
| ) |
| union all |
| ( |
| -- t2 left join t4 builds a plan that broadcasts t4, |
| -- so that the join's locus is t2's locus: |
| -- strewn on 2 segs |
| select |
| * |
| from t2_12146 left join t4_12146 on t2_12146.b = t4_12146.b |
| ) -- the first two subplans' loci are not the same, |
| -- because a strewn locus is never considered equal to another |
| union all |
| ( |
| -- this will be a full-to-full redistribution |
| select |
| * |
| from t3_12146 join t4_12146 on t3_12146.b = t4_12146.a |
| ) |
| ) x; |
| QUERY PLAN |
| ---------------------------------------------------------------------------------------------------------------------------------------------- |
| Finalize Aggregate (cost=60000000416.93..60000000416.94 rows=1 width=8) |
| -> Gather Motion 3:1 (slice1; segments: 3) (cost=60000000416.88..60000000416.93 rows=3 width=8) |
| -> Partial Aggregate (cost=60000000416.88..60000000416.89 rows=1 width=8) |
| -> Append (cost=20000000001.29..60000000391.87 rows=10003 width=0) |
| -> Subquery Scan on "*SELECT* 1" (cost=20000000001.29..20000000169.80 rows=5000 width=0) |
| -> Hash Left Join (cost=20000000001.29..20000000119.80 rows=5000 width=16) |
| Hash Cond: (t1_12146.b = t3_12146.b) |
| -> Seq Scan on t1_12146 (cost=10000000000.00..10000000056.00 rows=5000 width=4) |
| -> Hash (cost=10000000001.17..10000000001.17 rows=10 width=4) |
| -> Broadcast Motion 3:3 (slice2; segments: 3) (cost=10000000000.00..10000000001.17 rows=10 width=4) |
| -> Seq Scan on t3_12146 (cost=10000000000.00..10000000001.03 rows=3 width=4) |
| -> Subquery Scan on "*SELECT* 2" (cost=20000000001.29..20000000169.80 rows=5000 width=0) |
| -> Hash Left Join (cost=20000000001.29..20000000119.80 rows=5000 width=16) |
| Hash Cond: (t2_12146.b = t4_12146.b) |
| -> Seq Scan on t2_12146 (cost=10000000000.00..10000000056.00 rows=5000 width=4) |
| -> Hash (cost=10000000001.17..10000000001.17 rows=10 width=4) |
| -> Broadcast Motion 3:3 (slice3; segments: 3) (cost=10000000000.00..10000000001.17 rows=10 width=4) |
| -> Seq Scan on t4_12146 (cost=10000000000.00..10000000001.03 rows=3 width=4) |
| -> Subquery Scan on "*SELECT* 3" (cost=20000000001.08..20000000002.25 rows=3 width=0) |
| -> Hash Join (cost=20000000001.08..20000000002.22 rows=3 width=16) |
| Hash Cond: (t3_12146_1.b = t4_12146_1.a) |
| -> Redistribute Motion 3:3 (slice4; segments: 3) (cost=10000000000.00..10000000001.10 rows=3 width=4) |
| Hash Key: t3_12146_1.b |
| -> Seq Scan on t3_12146 t3_12146_1 (cost=10000000000.00..10000000001.03 rows=3 width=4) |
| -> Hash (cost=10000000001.03..10000000001.03 rows=3 width=4) |
| -> Seq Scan on t4_12146 t4_12146_1 (cost=10000000000.00..10000000001.03 rows=3 width=4) |
| Optimizer: Postgres query optimizer |
| (27 rows) |
| |
| select count(*) |
| from |
| ( |
| ( |
| -- t1 left join t3 builds a plan that broadcasts t3, |
| -- so that the join's locus is t1's locus: |
| -- strewn on 2 segs |
| select |
| * |
| from t1_12146 left join t3_12146 on t1_12146.b = t3_12146.b |
| ) |
| union all |
| ( |
| -- t2 left join t4 builds a plan that broadcasts t4, |
| -- so that the join's locus is t2's locus: |
| -- strewn on 2 segs |
| select |
| * |
| from t2_12146 left join t4_12146 on t2_12146.b = t4_12146.b |
| ) -- the first two subplans' loci are not the same, |
| -- because a strewn locus is never considered equal to another |
| union all |
| ( |
| -- this will be a full-to-full redistribution |
| select |
| * |
| from t3_12146 join t4_12146 on t3_12146.b = t4_12146.a |
| ) |
| ) x; |
| count |
| ------- |
| 20010 |
| (1 row) |
| |
| drop table t1_12146; |
| drop table t2_12146; |
| drop table t3_12146; |
| drop table t4_12146; |
| reset allow_system_table_mods; |
| -- |
| -- test https://github.com/apache/cloudberry/issues/593 |
| -- |
| CREATE TABLE t0_issue_593(c0 bigserial PRIMARY KEY) USING heap WITH (autovacuum_vacuum_threshold=1468046284, autovacuum_analyze_threshold=1889118206, autovacuum_vacuum_cost_delay=9, fillfactor=25, autovacuum_freeze_max_age=1860760049, autovacuum_enabled=0, autovacuum_freeze_min_age=402702412, autovacuum_vacuum_cost_limit=2500); |
| CREATE TABLE IF NOT EXISTS t1_issue_593(LIKE t0_issue_593); |
| NOTICE: table doesn't have 'DISTRIBUTED BY' clause, defaulting to distribution columns from LIKE table |
| CREATE TABLE IF NOT EXISTS t2_issue_593(LIKE t0_issue_593 INCLUDING INDEXES); |
| NOTICE: table doesn't have 'DISTRIBUTED BY' clause, defaulting to distribution columns from LIKE table |
| CREATE UNLOGGED TABLE IF NOT EXISTS t3_issue_593(LIKE t2_issue_593); |
| NOTICE: table doesn't have 'DISTRIBUTED BY' clause, defaulting to distribution columns from LIKE table |
| CREATE TEMPORARY TABLE IF NOT EXISTS t4_issue_593(LIKE t3_issue_593); |
| NOTICE: table doesn't have 'DISTRIBUTED BY' clause, defaulting to distribution columns from LIKE table |
| SELECT '100.147.127.36' FROM t1_issue_593, ONLY t2_issue_593, t4_issue_593* |
| CROSS JOIN t0_issue_593* CROSS JOIN ONLY t3_issue_593 GROUP BY pg_jit_available() |
| HAVING inet_same_family('148.199.107.23', '214.26.36.61') UNION ALL |
| SELECT '100.147.127.36' FROM t1_issue_593*, ONLY t2_issue_593, t4_issue_593* |
| CROSS JOIN t0_issue_593* CROSS JOIN ONLY t3_issue_593 GROUP BY pg_jit_available() |
| HAVING NOT (inet_same_family('148.199.107.23', '214.26.36.61')) UNION ALL |
| SELECT '100.147.127.36' FROM t1_issue_593*, ONLY t2_issue_593, t4_issue_593* |
| CROSS JOIN t0_issue_593 CROSS JOIN ONLY t3_issue_593 GROUP BY pg_jit_available() |
| HAVING (inet_same_family('148.199.107.23', '214.26.36.61')) ISNULL; |
| ?column? |
| ---------- |
| (0 rows) |
| |
| drop table t0_issue_593; |
| drop table t1_issue_593; |
| drop table t2_issue_593; |
| drop table t3_issue_593; |
| drop table t4_issue_593; |
| -- start_ignore |
| drop table if exists bfv_planner_x; |
| drop table if exists testbadsql; |
| drop table if exists bfv_planner_foo; |
| drop table if exists testmedian; |
| drop table if exists bfv_planner_t1; |
| drop table if exists bfv_planner_t2; |
| -- end_ignore |