ORCA: skip MVCC system columns for standalone AO tables (#1409)

yjhjstz · web-flow · commit c3be6e5d9bee · 2025-10-22T10:42:19.000+08:00
Fix ORCA fallback error when querying AO tables with multiple DISTINCT aggregates:
  "Invalid system target list found for AO table"

AO tables don't support the MVCC system columns (xmin, cmin, xmax, cmax).
Skip these columns when building metadata for standalone AO tables
(row-oriented, column-oriented, and PAX storage), but preserve them for
partitioned tables and their partitions to maintain column mapping consistency.
diff --git a/contrib/pax_storage/src/test/regress/expected/gporca_optimizer.out b/contrib/pax_storage/src/test/regress/expected/gporca_optimizer.out
diff --git a/contrib/pax_storage/src/test/regress/expected/tsrf_optimizer.out b/contrib/pax_storage/src/test/regress/expected/tsrf_optimizer.out
@@ -88,15 +88,16 @@ ANALYZE few;
 -- SRF with a provably-dummy relation
 explain (verbose, costs off)
 SELECT unnest(ARRAY[1, 2]) FROM few WHERE false;
-              QUERY PLAN              
---------------------------------------
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
  ProjectSet
    Output: unnest('{1,2}'::integer[])
    ->  Result
-         Output: NULL::integer, NULL::tid, NULL::xid, NULL::cid, NULL::xid, NULL::cid, NULL::oid, NULL::integer, NULL::oid
+         Output: NULL::integer, NULL::tid, NULL::oid, NULL::integer, NULL::oid
          One-Time Filter: false
- Optimizer: Pivotal Optimizer (GPORCA)
-(6 rows)
+ Settings: optimizer = 'on'
+ Optimizer: GPORCA
+(7 rows)
 
 SELECT unnest(ARRAY[1, 2]) FROM few WHERE false;
  unnest 
@@ -117,12 +118,12 @@ SELECT * FROM few f1,
          ->  ProjectSet
                Output: unnest('{1,2}'::integer[])
                ->  Result
-                     Output: NULL::integer, NULL::tid, NULL::xid, NULL::cid, NULL::xid, NULL::cid, NULL::oid, NULL::integer, NULL::oid
+                     Output: NULL::integer, NULL::tid, NULL::oid, NULL::integer, NULL::oid
                      One-Time Filter: false
          ->  Seq Scan on public.few f1
                Output: id, dataa, datab
- Settings: enable_parallel = 'off', optimizer = 'on'
- Optimizer: Pivotal Optimizer (GPORCA)
+ Settings: optimizer = 'on'
+ Optimizer: GPORCA
 (14 rows)
 
 SELECT * FROM few f1,
diff --git a/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp b/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp
@@ -862,13 +862,31 @@ CTranslatorRelcacheToDXL::RetrieveRelDistributionOpFamilies(CMemoryPool *mp,
 void
 CTranslatorRelcacheToDXL::AddSystemColumns(CMemoryPool *mp,
 										   CMDColumnArray *mdcol_array,
-										   Relation /*rel*/)
+										   Relation rel)
 {
+	// Get storage type to determine which system columns are supported
+	IMDRelation::Erelstoragetype rel_storage_type = RetrieveRelStorageType(rel);
+	BOOL is_standalone_ao_table = ((rel_storage_type == IMDRelation::ErelstorageAppendOnlyRows ||
+						rel_storage_type == IMDRelation::ErelstorageAppendOnlyCols ||
+						rel_storage_type == IMDRelation::ErelstoragePAX)) &&
+						rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE &&
+						!rel->rd_rel->relispartition;
+
 	for (INT i = SelfItemPointerAttributeNumber;
 		 i > FirstLowInvalidHeapAttributeNumber; i--)
 	{
 		AttrNumber attno = AttrNumber(i);
 		GPOS_ASSERT(0 != attno);
+		// AO tables don't support MVCC-related system columns (xmin, cmin, xmax, cmax)
+		// Skip these columns for AO tables to avoid "Invalid system target list" errors
+		if (is_standalone_ao_table &&
+			(attno == MinTransactionIdAttributeNumber ||  // xmin (-2)
+			 attno == MinCommandIdAttributeNumber ||      // cmin (-3)
+			 attno == MaxTransactionIdAttributeNumber ||  // xmax (-4)
+			 attno == MaxCommandIdAttributeNumber))       // cmax (-5)
+		{
+			continue;
+		}
 
 		const FormData_pg_attribute *att_tup = SystemAttributeDefinition(attno);
 
diff --git a/src/test/regress/expected/gp_dqa.out b/src/test/regress/expected/gp_dqa.out
@@ -3067,5 +3067,51 @@ select count(distinct a), count(distinct b) from dqa_f4 group by c;
      1 |     1
 (3 rows)
 
+-- Test AO table dqa with multiple distinct aggs
+create table dqa_f5(a int, b int, c int) using ao_column;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+insert into dqa_f5 values(null, null, null);
+insert into dqa_f5 values(1, 1, 1);
+insert into dqa_f5 values(2, 2, 2);
+explain (verbose on, costs off) select count(distinct a), count(distinct b) from dqa_f5 group by c;
+                                                QUERY PLAN                                                 
+-----------------------------------------------------------------------------------------------------------
+ Finalize HashAggregate
+   Output: count(a), count(b), c
+   Group Key: dqa_f5.c
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Output: c, (PARTIAL count(a)), (PARTIAL count(b))
+         ->  Partial HashAggregate
+               Output: c, PARTIAL count(a), PARTIAL count(b)
+               Group Key: dqa_f5.c
+               ->  HashAggregate
+                     Output: c, a, b, (AggExprId)
+                     Group Key: (AggExprId), dqa_f5.a, dqa_f5.b, dqa_f5.c
+                     ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                           Output: c, a, b, (AggExprId)
+                           Hash Key: c, a, b, (AggExprId)
+                           ->  Streaming HashAggregate
+                                 Output: c, a, b, (AggExprId)
+                                 Group Key: AggExprId, dqa_f5.a, dqa_f5.b, dqa_f5.c
+                                 ->  TupleSplit
+                                       Output: c, a, b, AggExprId
+                                       Split by Col: (dqa_f5.a), (dqa_f5.b)
+                                       Group Key: dqa_f5.c
+                                       ->  Seq Scan on public.dqa_f5
+                                             Output: c, a, b
+ Settings: enable_groupagg = 'off', enable_hashagg = 'on', gp_motion_cost_per_row = '2', optimizer = 'off'
+ Optimizer: Postgres query optimizer
+(25 rows)
+
+select count(distinct a), count(distinct b) from dqa_f5 group by c;
+ count | count 
+-------+-------
+     0 |     0
+     1 |     1
+     1 |     1
+(3 rows)
+
 reset optimizer_enable_multiple_distinct_aggs;
 drop table dqa_f4;
+drop table dqa_f5;
diff --git a/src/test/regress/expected/gp_dqa_optimizer.out b/src/test/regress/expected/gp_dqa_optimizer.out
@@ -3304,5 +3304,67 @@ select count(distinct a), count(distinct b) from dqa_f4 group by c;
      0 |     0
 (3 rows)
 
+-- Test AO table dqa with multiple distinct aggs
+create table dqa_f5(a int, b int, c int) using ao_column;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+insert into dqa_f5 values(null, null, null);
+insert into dqa_f5 values(1, 1, 1);
+insert into dqa_f5 values(2, 2, 2);
+explain (verbose on, costs off) select count(distinct a), count(distinct b) from dqa_f5 group by c;
+                                                                             QUERY PLAN                                                                              
+---------------------------------------------------------------------------------------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Output: (count(DISTINCT share0_ref3.a)), (count(DISTINCT share0_ref2.b))
+   ->  Sequence
+         Output: (count(DISTINCT share0_ref3.a)), (count(DISTINCT share0_ref2.b))
+         ->  Shared Scan (share slice:id 1:0)
+               Output: share0_ref1.a, share0_ref1.b, share0_ref1.c, share0_ref1.ctid, share0_ref1.tableoid, share0_ref1.gp_segment_id, share0_ref1.gp_foreign_server
+               ->  Seq Scan on public.dqa_f5
+                     Output: dqa_f5.a, dqa_f5.b, dqa_f5.c, dqa_f5.ctid, dqa_f5.tableoid, dqa_f5.gp_segment_id, dqa_f5.gp_foreign_server
+         ->  Hash Join
+               Output: (count(DISTINCT share0_ref3.a)), (count(DISTINCT share0_ref2.b))
+               Hash Cond: (NOT (share0_ref3.c IS DISTINCT FROM share0_ref2.c))
+               ->  GroupAggregate
+                     Output: count(DISTINCT share0_ref3.a), share0_ref3.c
+                     Group Key: share0_ref3.c
+                     ->  Sort
+                           Output: share0_ref3.a, share0_ref3.c
+                           Sort Key: share0_ref3.c
+                           ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                                 Output: share0_ref3.a, share0_ref3.c
+                                 Hash Key: share0_ref3.c
+                                 ->  Result
+                                       Output: share0_ref3.a, share0_ref3.c
+                                       ->  Shared Scan (share slice:id 2:0)
+                                             Output: share0_ref3.a, share0_ref3.b, share0_ref3.c
+               ->  Hash
+                     Output: (count(DISTINCT share0_ref2.b)), share0_ref2.c
+                     ->  GroupAggregate
+                           Output: count(DISTINCT share0_ref2.b), share0_ref2.c
+                           Group Key: share0_ref2.c
+                           ->  Sort
+                                 Output: share0_ref2.b, share0_ref2.c
+                                 Sort Key: share0_ref2.c
+                                 ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                                       Output: share0_ref2.b, share0_ref2.c
+                                       Hash Key: share0_ref2.c
+                                       ->  Result
+                                             Output: share0_ref2.b, share0_ref2.c
+                                             ->  Shared Scan (share slice:id 3:0)
+                                                   Output: share0_ref2.a, share0_ref2.b, share0_ref2.c
+ Settings: enable_groupagg = 'off', enable_hashagg = 'on', gp_motion_cost_per_row = '2'
+ Optimizer: GPORCA
+(41 rows)
+
+select count(distinct a), count(distinct b) from dqa_f5 group by c;
+ count | count 
+-------+-------
+     1 |     1
+     0 |     0
+     1 |     1
+(3 rows)
+
 reset optimizer_enable_multiple_distinct_aggs;
 drop table dqa_f4;
+drop table dqa_f5;
diff --git a/src/test/regress/expected/rowhints_optimizer.out b/src/test/regress/expected/rowhints_optimizer.out
@@ -33,14 +33,14 @@ ANALYZE my_table, your_table, our_table;
 EXPLAIN SELECT t1.a, t2.a FROM my_table AS t1, your_table AS t2, our_table AS t3;
                                                 QUERY PLAN
 -----------------------------------------------------------------------------------------------------------
- Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..1356765552.28 rows=1000000 width=8)
-   ->  Nested Loop  (cost=0.00..1356765522.47 rows=333334 width=8)
+ Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..1356765398.57 rows=1000000 width=8)
+   ->  Nested Loop  (cost=0.00..1356765368.75 rows=333334 width=8)
          Join Filter: true
          ->  Broadcast Motion 3:3  (slice3; segments: 3)  (cost=0.00..431.01 rows=100 width=4)
-               ->  Seq Scan on your_table t2  (cost=0.00..431.00 rows=34 width=4)
-         ->  Nested Loop  (cost=0.00..1324091.78 rows=3334 width=4)
-               Join Filter: true
                ->  Seq Scan on my_table t1  (cost=0.00..431.00 rows=34 width=4)
+         ->  Nested Loop  (cost=0.00..1324091.63 rows=3334 width=4)
+               Join Filter: true
+               ->  Seq Scan on your_table t2  (cost=0.00..431.00 rows=34 width=4)
                ->  Materialize  (cost=0.00..431.00 rows=100 width=1)
                      ->  Broadcast Motion 3:3  (slice2; segments: 3)  (cost=0.00..431.00 rows=100 width=1)
                            ->  Dynamic Seq Scan on our_table t3  (cost=0.00..431.00 rows=34 width=1)
@@ -78,10 +78,10 @@ not used hint:
    ->  Nested Loop  (cost=xxx..xxx rows=41 width=xxx)
          Join Filter: true
          ->  Broadcast Motion 3:3  (slice3; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
-               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
          ->  Nested Loop  (cost=xxx..xxx rows=3334 width=xxx)
                Join Filter: true
-               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
                ->  Materialize  (cost=xxx..xxx rows=100 width=xxx)
                      ->  Broadcast Motion 3:3  (slice2; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
                            ->  Dynamic Seq Scan on our_table t3  (cost=xxx..xxx rows=34 width=xxx)
@@ -110,10 +110,10 @@ not used hint:
    ->  Nested Loop  (cost=xxx..xxx rows=333375 width=xxx)
          Join Filter: true
          ->  Broadcast Motion 3:3  (slice3; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
-               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
          ->  Nested Loop  (cost=xxx..xxx rows=3334 width=xxx)
                Join Filter: true
-               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
                ->  Materialize  (cost=xxx..xxx rows=100 width=xxx)
                      ->  Broadcast Motion 3:3  (slice2; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
                            ->  Dynamic Seq Scan on our_table t3  (cost=xxx..xxx rows=34 width=xxx)
@@ -142,10 +142,10 @@ not used hint:
    ->  Nested Loop  (cost=xxx..xxx rows=333293 width=xxx)
          Join Filter: true
          ->  Broadcast Motion 3:3  (slice3; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
-               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
          ->  Nested Loop  (cost=xxx..xxx rows=3334 width=xxx)
                Join Filter: true
-               ->  Seq Scan on my_table t1  (cost=xxx..xxx rows=34 width=xxx)
+               ->  Seq Scan on your_table t2  (cost=xxx..xxx rows=34 width=xxx)
                ->  Materialize  (cost=xxx..xxx rows=100 width=xxx)
                      ->  Broadcast Motion 3:3  (slice2; segments: 3)  (cost=xxx..xxx rows=100 width=xxx)
                            ->  Dynamic Seq Scan on our_table t3  (cost=xxx..xxx rows=34 width=xxx)
diff --git a/src/test/regress/sql/gp_dqa.sql b/src/test/regress/sql/gp_dqa.sql
@@ -604,6 +604,15 @@ select count(distinct a), count(distinct b) from dqa_f4 group by c;
 set optimizer_enable_multiple_distinct_aggs=on;
 explain (verbose on, costs off) select count(distinct a), count(distinct b) from dqa_f4 group by c;
 select count(distinct a), count(distinct b) from dqa_f4 group by c;
-reset optimizer_enable_multiple_distinct_aggs;
 
+-- Test AO table dqa with multiple distinct aggs
+create table dqa_f5(a int, b int, c int) using ao_column;
+insert into dqa_f5 values(null, null, null);
+insert into dqa_f5 values(1, 1, 1);
+insert into dqa_f5 values(2, 2, 2);
+explain (verbose on, costs off) select count(distinct a), count(distinct b) from dqa_f5 group by c;
+select count(distinct a), count(distinct b) from dqa_f5 group by c;
+
+reset optimizer_enable_multiple_distinct_aggs;
 drop table dqa_f4;
+drop table dqa_f5;