
[FLINK-37479][postgres] Add support for PARTITIONED TABLE #4004


Open · wants to merge 6 commits into master
12 changes: 12 additions & 0 deletions docs/content.zh/docs/connectors/flink-sources/postgres-cdc.md
@@ -378,6 +378,18 @@ The following options are available only when `scan.incremental.snapshot.enabled=true`
The table chunks use an even-distribution calculation optimization when the data distribution is even, and a splitting query is used when it is uneven.
The distribution factor is calculated as (MAX(id) - MIN(id) + 1) / rowCount.</td>
</tr>
<tr>
<td>scan.publish-via-partition-root.enabled</td>
<td>optional</td>
<td style="word-wrap: break-word;">false</td>
<td>Boolean</td>
<td>
Whether to enable reading partitioned tables via the partition root.<br>
If enabled:
(1) the PUBLICATION must be created beforehand with the parameter publish_via_partition_root=true;
(2) the table list (regex or predefined list) should match only the parent table name; if it matches both parent and child tables, snapshot data will be read twice.
</td>
</tr>
</tbody>
</table>
</div>
12 changes: 12 additions & 0 deletions docs/content/docs/connectors/flink-sources/postgres-cdc.md
@@ -265,6 +265,18 @@ SELECT * FROM shipments;
For example, updating an already updated value in the snapshot, or deleting an already deleted entry in the snapshot. These replayed change log events should be handled specially.
</td>
</tr>
<tr>
<td>scan.publish-via-partition-root.enabled</td>
<td>optional</td>
<td style="word-wrap: break-word;">false</td>
<td>Boolean</td>
<td>
Whether to enable reading partitioned tables via the partition root.<br>
If enabled:
(1) the PUBLICATION must be created beforehand with the parameter publish_via_partition_root=true;
(2) the table list (regex or predefined list) should match only the parent table name; if it matches both parent and child tables, snapshot data will be read twice.
</td>
</tr>
</tbody>
</table>
</div>
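For prerequisite (1), the publication has to exist before the connector starts; publish_via_partition_root requires PostgreSQL 13 or later. Below is a minimal JDBC sketch of that setup step; the URL, credentials, publication name, and table name are illustrative assumptions, not values from this PR:

import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.Statement;

public class CreateRootPublication {
    public static void main(String[] args) throws Exception {
        // Assumed connection details; adjust to your environment.
        try (Connection conn =
                        DriverManager.getConnection(
                                "jdbc:postgresql://localhost:5432/postgres", "postgres", "postgres");
                Statement stmt = conn.createStatement()) {
            // publish_via_partition_root=true makes changes on child partitions
            // appear under the parent (root) table's identity in the stream.
            stmt.execute(
                    "CREATE PUBLICATION dbz_publication "
                            + "FOR TABLE inventory_partitioned.products "
                            + "WITH (publish_via_partition_root = true)");
        }
    }
}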
PostgresDialect.java
@@ -176,9 +176,14 @@ public ChunkSplitter createChunkSplitter(
@Override
public List<TableId> discoverDataCollections(JdbcSourceConfig sourceConfig) {
try (JdbcConnection jdbc = openJdbcConnection(sourceConfig)) {
boolean publishViaPartitionRoot =
((PostgresSourceConfig) sourceConfig).getPublishViaPartitionRoot();
return TableDiscoveryUtils.listTables(
// there is always a single database provided
sourceConfig.getDatabaseList().get(0), jdbc, sourceConfig.getTableFilters());
sourceConfig.getDatabaseList().get(0),
jdbc,
sourceConfig.getTableFilters(),
publishViaPartitionRoot);
} catch (SQLException e) {
throw new FlinkRuntimeException("Error to discover tables: " + e.getMessage(), e);
}
PostgresSourceBuilder.java
@@ -289,6 +289,12 @@ public PostgresSourceBuilder<T> lsnCommitCheckpointsDelay(int lsnCommitDelay) {
return this;
}

/** Whether the connector should read partitioned tables via the partition root. */
public PostgresSourceBuilder<T> publishViaPartitionRoot(boolean publishViaPartitionRoot) {
this.configFactory.setPublishViaPartitionRoot(publishViaPartitionRoot);
return this;
}

/**
* Build the {@link PostgresIncrementalSource}.
*
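For DataStream users, the new builder method composes with the existing options. A minimal usage sketch, assuming the standard incremental-source builder API; hostname, credentials, slot, and table names are placeholders:

import org.apache.flink.cdc.connectors.base.source.jdbc.JdbcIncrementalSource;
import org.apache.flink.cdc.connectors.postgres.source.PostgresSourceBuilder;
import org.apache.flink.cdc.debezium.JsonDebeziumDeserializationSchema;

JdbcIncrementalSource<String> source =
        PostgresSourceBuilder.PostgresIncrementalSource.<String>builder()
                .hostname("localhost")
                .port(5432)
                .database("postgres")
                .schemaList("inventory_partitioned")
                .tableList("inventory_partitioned.products") // parent table only
                .username("postgres")
                .password("postgres")
                .slotName("flink")
                .decodingPluginName("pgoutput")
                .deserializer(new JsonDebeziumDeserializationSchema())
                .publishViaPartitionRoot(true) // option added in this PR
                .build();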
PostgresSourceConfig.java
@@ -38,6 +38,7 @@ public class PostgresSourceConfig extends JdbcSourceConfig {

private final int subtaskId;
private final int lsnCommitCheckpointsDelay;
private final boolean publishViaPartitionRoot;

public PostgresSourceConfig(
int subtaskId,
@@ -67,7 +68,8 @@ public PostgresSourceConfig(
boolean skipSnapshotBackfill,
boolean isScanNewlyAddedTableEnabled,
int lsnCommitCheckpointsDelay,
boolean assignUnboundedChunkFirst) {
boolean assignUnboundedChunkFirst,
boolean publishViaPartitionRoot) {
super(
startupOptions,
databaseList,
@@ -97,6 +99,7 @@ public PostgresSourceConfig(
assignUnboundedChunkFirst);
this.subtaskId = subtaskId;
this.lsnCommitCheckpointsDelay = lsnCommitCheckpointsDelay;
this.publishViaPartitionRoot = publishViaPartitionRoot;
}

/**
@@ -117,6 +120,15 @@ public int getLsnCommitCheckpointsDelay() {
return this.lsnCommitCheckpointsDelay;
}

/**
 * Returns the {@code publishViaPartitionRoot} value.
 *
 * @return whether partitioned tables are read via the partition root
 */
public boolean getPublishViaPartitionRoot() {
return publishViaPartitionRoot;
}

/**
* Returns the slot name for backfill task.
*
PostgresSourceConfigFactory.java
@@ -52,6 +52,8 @@ public class PostgresSourceConfigFactory extends JdbcSourceConfigFactory {

private int lsnCommitCheckpointsDelay;

private boolean publishViaPartitionRoot;

/** Creates a new {@link PostgresSourceConfig} for the given subtask {@code subtaskId}. */
@Override
public PostgresSourceConfig create(int subtaskId) {
@@ -133,7 +135,8 @@ public PostgresSourceConfig create(int subtaskId) {
skipSnapshotBackfill,
scanNewlyAddedTableEnabled,
lsnCommitCheckpointsDelay,
assignUnboundedChunkFirst);
assignUnboundedChunkFirst,
publishViaPartitionRoot);
}

/**
@@ -182,4 +185,9 @@ public void heartbeatInterval(Duration heartbeatInterval) {
public void setLsnCommitCheckpointsDelay(int lsnCommitCheckpointsDelay) {
this.lsnCommitCheckpointsDelay = lsnCommitCheckpointsDelay;
}

/** Enable reading partitioned tables via the partition root. */
public void setPublishViaPartitionRoot(boolean publishViaPartitionRoot) {
this.publishViaPartitionRoot = publishViaPartitionRoot;
}
}
PostgresSourceOptions.java
@@ -88,4 +88,14 @@ public class PostgresSourceOptions extends JdbcSourceOptions {
+ "By setting this to higher value, the offset that is consumed by global slot will be "
+ "committed after multiple checkpoint delays instead of after each checkpoint completion.\n"
+ "This allows continuous recycle of log files in stream phase.");

public static final ConfigOption<Boolean> SCAN_PUBLISH_VIA_PARTITION_ROOT_ENABLED =
ConfigOptions.key("scan.publish-via-partition-root.enabled")
.booleanType()
.defaultValue(Boolean.FALSE)
.withDescription(
"Enable reading from partitioned table via partition root.\n"
+ "If enabled:\n"
+ "(1) PUBLICATION must be created beforehand with parameter publish_via_partition_root=true\n"
+ "(2) Table list (regex or predefined list) should only match the parent table name, if table list matches both parent and child tables, snapshot data will be read twice.");
}
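In Flink SQL, the new option is just another entry in the WITH clause. A sketch via the Table API; the connection values and schema are placeholders, and only the parent table is listed, per the description above:

import org.apache.flink.table.api.EnvironmentSettings;
import org.apache.flink.table.api.TableEnvironment;

public class PartitionRootExample {
    public static void main(String[] args) {
        TableEnvironment tEnv = TableEnvironment.create(EnvironmentSettings.inStreamingMode());
        tEnv.executeSql(
                "CREATE TABLE products ("
                        + " id INT, name STRING, PRIMARY KEY (id) NOT ENFORCED"
                        + ") WITH ("
                        + " 'connector' = 'postgres-cdc',"
                        + " 'hostname' = 'localhost',"
                        + " 'port' = '5432',"
                        + " 'username' = 'postgres',"
                        + " 'password' = 'postgres',"
                        + " 'database-name' = 'postgres',"
                        + " 'schema-name' = 'inventory_partitioned',"
                        + " 'table-name' = 'products'," // parent table only
                        + " 'slot.name' = 'flink',"
                        + " 'scan.incremental.snapshot.enabled' = 'true',"
                        + " 'scan.publish-via-partition-root.enabled' = 'true'"
                        + ")");
        tEnv.executeSql("SELECT * FROM products").print();
    }
}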
TableDiscoveryUtils.java
@@ -34,11 +34,17 @@ public class TableDiscoveryUtils {
private static final Logger LOG = LoggerFactory.getLogger(TableDiscoveryUtils.class);

public static List<TableId> listTables(
String database, JdbcConnection jdbc, RelationalTableFilters tableFilters)
String database,
JdbcConnection jdbc,
RelationalTableFilters tableFilters,
boolean publishViaPartitionRoot)
throws SQLException {

Set<TableId> allTableIds =
jdbc.readTableNames(database, null, null, new String[] {"TABLE"});
loserwang1024 (Contributor) commented on Apr 27, 2025:

I hope we can add a param such as `partitioned` (maybe we can check whether Debezium already has one, so we can reuse it). When this param is enabled:

  1. discover partitioned tables here.
  2. add publish_via_partition_root=true when creating the publication. We could add an initRootPublication like what io.debezium.connector.postgresql.connection.PostgresReplicationConnection#initPublication does, or just modify that method. (But this class is copied from Debezium, so diverging too much is not recommended.)

Reading partitioned tables already works, but users have to create the publication in advance. To be honest, I hope Debezium implements this; if it lacks it, we can do it ourselves to make things easier for users.

Just my own thought. @phamvinh1712 @leonardBang, what do you think?

phamvinh1712 (Contributor, Author) replied on Apr 27, 2025:

I know that Debezium doesn't create the publication with publish_via_partition_root=true, so users need to create it themselves in advance. I agree that doing it for them would help users, but I'm afraid it would make it hard for us to upgrade the Debezium version (which I believe we need to do at some point, since Flink CDC is using the old Debezium 1.9.6).

loserwang1024 (Contributor) replied:

There is also another concern: if the user supplies a regex as the table name, both the parent table and its child tables will be captured, and snapshot data will be read twice.

Thus, an option description can also warn users about this: if they enable partitioned tables, they should pay attention to it.

phamvinh1712 (Contributor, Author) replied:

> There is also another concern: if the user supplies a regex as the table name, both the parent table and its child tables will be captured, and snapshot data will be read twice. Thus, an option description can also warn users about this.

Do you have any suggestions for this? Should we add a section to the Flink CDC docs for it?

String[] tableTypes = new String[] {"TABLE"};
if (publishViaPartitionRoot) {
tableTypes = new String[] {"TABLE", "PARTITIONED TABLE"};
}
Set<TableId> allTableIds = jdbc.readTableNames(database, null, null, tableTypes);

Set<TableId> capturedTables =
allTableIds.stream()
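Background on the two-element type filter: the PostgreSQL JDBC driver reports a declaratively partitioned parent (relkind 'p') with table type "PARTITIONED TABLE" rather than "TABLE", so discovery that filters on "TABLE" alone never sees the root. A standalone sketch against DatabaseMetaData; connection details are placeholders:

import java.sql.Connection;
import java.sql.DatabaseMetaData;
import java.sql.DriverManager;
import java.sql.ResultSet;

public class ListPartitionedTables {
    public static void main(String[] args) throws Exception {
        try (Connection conn =
                DriverManager.getConnection(
                        "jdbc:postgresql://localhost:5432/postgres", "postgres", "postgres")) {
            DatabaseMetaData meta = conn.getMetaData();
            // Ask for both types; with {"TABLE"} alone the partitioned parent is skipped.
            try (ResultSet rs =
                    meta.getTables(null, "inventory_partitioned", "%",
                            new String[] {"TABLE", "PARTITIONED TABLE"})) {
                while (rs.next()) {
                    System.out.println(
                            rs.getString("TABLE_NAME") + " -> " + rs.getString("TABLE_TYPE"));
                }
            }
        }
    }
}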
PostgreSQLTableFactory.java
@@ -59,6 +59,7 @@
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_INCREMENTAL_SNAPSHOT_CHUNK_SIZE;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_INCREMENTAL_SNAPSHOT_ENABLED;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_LSN_COMMIT_CHECKPOINTS_DELAY;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_PUBLISH_VIA_PARTITION_ROOT_ENABLED;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_SNAPSHOT_FETCH_SIZE;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SCAN_STARTUP_MODE;
import static org.apache.flink.cdc.connectors.postgres.source.config.PostgresSourceOptions.SLOT_NAME;
@@ -117,6 +118,7 @@ public DynamicTableSource createDynamicTableSource(DynamicTableFactory.Context c
boolean skipSnapshotBackfill = config.get(SCAN_INCREMENTAL_SNAPSHOT_BACKFILL_SKIP);
boolean isScanNewlyAddedTableEnabled = config.get(SCAN_NEWLY_ADDED_TABLE_ENABLED);
int lsnCommitCheckpointsDelay = config.get(SCAN_LSN_COMMIT_CHECKPOINTS_DELAY);
boolean publishViaPartitionRoot = config.get(SCAN_PUBLISH_VIA_PARTITION_ROOT_ENABLED);
boolean assignUnboundedChunkFirst =
config.get(SCAN_INCREMENTAL_SNAPSHOT_UNBOUNDED_CHUNK_FIRST_ENABLED);

@@ -165,7 +167,8 @@ public DynamicTableSource createDynamicTableSource(DynamicTableFactory.Context c
skipSnapshotBackfill,
isScanNewlyAddedTableEnabled,
lsnCommitCheckpointsDelay,
assignUnboundedChunkFirst);
assignUnboundedChunkFirst,
publishViaPartitionRoot);
}

@Override
@@ -209,6 +212,7 @@ public Set<ConfigOption<?>> optionalOptions() {
options.add(SCAN_NEWLY_ADDED_TABLE_ENABLED);
options.add(SCAN_LSN_COMMIT_CHECKPOINTS_DELAY);
options.add(SCAN_INCREMENTAL_SNAPSHOT_UNBOUNDED_CHUNK_FIRST_ENABLED);
options.add(SCAN_PUBLISH_VIA_PARTITION_ROOT_ENABLED);
return options;
}

PostgreSQLTableSource.java
@@ -86,6 +86,7 @@ public class PostgreSQLTableSource implements ScanTableSource, SupportsReadingMetadata
private final boolean scanNewlyAddedTableEnabled;
private final int lsnCommitCheckpointsDelay;
private final boolean assignUnboundedChunkFirst;
private final boolean publishViaPartitionRoot;

// --------------------------------------------------------------------------------------------
// Mutable attributes
@@ -126,7 +127,8 @@ public PostgreSQLTableSource(
boolean skipSnapshotBackfill,
boolean isScanNewlyAddedTableEnabled,
int lsnCommitCheckpointsDelay,
boolean assignUnboundedChunkFirst) {
boolean assignUnboundedChunkFirst,
boolean publishViaPartitionRoot) {
this.physicalSchema = physicalSchema;
this.port = port;
this.hostname = checkNotNull(hostname);
@@ -159,6 +161,7 @@ public PostgreSQLTableSource(
this.scanNewlyAddedTableEnabled = isScanNewlyAddedTableEnabled;
this.lsnCommitCheckpointsDelay = lsnCommitCheckpointsDelay;
this.assignUnboundedChunkFirst = assignUnboundedChunkFirst;
this.publishViaPartitionRoot = publishViaPartitionRoot;
}

@Override
@@ -222,6 +225,7 @@ public ScanRuntimeProvider getScanRuntimeProvider(ScanContext scanContext) {
.scanNewlyAddedTableEnabled(scanNewlyAddedTableEnabled)
.lsnCommitCheckpointsDelay(lsnCommitCheckpointsDelay)
.assignUnboundedChunkFirst(assignUnboundedChunkFirst)
.publishViaPartitionRoot(publishViaPartitionRoot)
.build();
return SourceProvider.of(parallelSource);
} else {
@@ -291,7 +295,8 @@ public DynamicTableSource copy() {
skipSnapshotBackfill,
scanNewlyAddedTableEnabled,
lsnCommitCheckpointsDelay,
assignUnboundedChunkFirst);
assignUnboundedChunkFirst,
publishViaPartitionRoot);
source.metadataKeys = metadataKeys;
source.producedDataType = producedDataType;
return source;
PostgresDialectTest.java
@@ -46,6 +46,14 @@ class PostgresDialectTest extends PostgresTestBase {
POSTGRES_CONTAINER.getUsername(),
POSTGRES_CONTAINER.getPassword());

private final UniqueDatabase inventoryPartitionedDatabase =
new UniqueDatabase(
POSTGRES_CONTAINER,
"postgres3",
"inventory_partitioned",
POSTGRES_CONTAINER.getUsername(),
POSTGRES_CONTAINER.getPassword());

@Test
void testDiscoverDataCollectionsInMultiDatabases() {

@@ -88,4 +96,23 @@ void testDiscoverDataCollectionsInMultiDatabases() {
configFactoryOfInventoryDatabase2.create(0));
Assertions.assertThat(tableIdsOfInventoryDatabase2).isEmpty();
}

@Test
void testDiscoverDataCollectionsForPartitionedTable() {
// initialize the database with a partitioned table
inventoryPartitionedDatabase.createAndInitialize();

// get table named 'inventory_partitioned.products' from inventoryPartitionedDatabase
PostgresSourceConfigFactory configFactoryOfInventoryPartitionedDatabase =
getMockPostgresSourceConfigFactory(
inventoryPartitionedDatabase, "inventory_partitioned", "products", 10);
configFactoryOfInventoryPartitionedDatabase.setPublishViaPartitionRoot(true);
PostgresDialect dialectOfInventoryPartitionedDatabase =
new PostgresDialect(configFactoryOfInventoryPartitionedDatabase.create(0));
List<TableId> tableIdsOfInventoryPartitionedDatabase =
dialectOfInventoryPartitionedDatabase.discoverDataCollections(
configFactoryOfInventoryPartitionedDatabase.create(0));
Assertions.assertThat(tableIdsOfInventoryPartitionedDatabase.get(0))
.hasToString("inventory_partitioned.products");
}
}
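The postgres3 inventory_partitioned fixture itself is not part of this diff; below is a hypothetical minimal equivalent, expressed as JDBC DDL so the test's expectation (only inventory_partitioned.products is discovered) is concrete. All names and connection values are assumptions:

import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.Statement;

public class InitPartitionedFixture {
    public static void main(String[] args) throws Exception {
        try (Connection conn =
                        DriverManager.getConnection(
                                "jdbc:postgresql://localhost:5432/postgres3", "postgres", "postgres");
                Statement stmt = conn.createStatement()) {
            stmt.execute("CREATE SCHEMA inventory_partitioned");
            // Parent (root) table: relkind 'p', reported as "PARTITIONED TABLE".
            stmt.execute(
                    "CREATE TABLE inventory_partitioned.products ("
                            + " id INT, name VARCHAR(255), PRIMARY KEY (id)"
                            + ") PARTITION BY RANGE (id)");
            // Child partition: a plain "TABLE"; with the root-publish option on,
            // discovery should match only the parent.
            stmt.execute(
                    "CREATE TABLE inventory_partitioned.products_p1 "
                            + "PARTITION OF inventory_partitioned.products "
                            + "FOR VALUES FROM (1) TO (1000)");
        }
    }
}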
MockPostgreSQLTableSource.java
@@ -66,7 +66,8 @@ public MockPostgreSQLTableSource(PostgreSQLTableSource postgreSQLTableSource) {
(boolean) get(postgreSQLTableSource, "skipSnapshotBackfill"),
(boolean) get(postgreSQLTableSource, "scanNewlyAddedTableEnabled"),
(int) get(postgreSQLTableSource, "lsnCommitCheckpointsDelay"),
(boolean) get(postgreSQLTableSource, "assignUnboundedChunkFirst"));
(boolean) get(postgreSQLTableSource, "assignUnboundedChunkFirst"),
(boolean) get(postgreSQLTableSource, "publishViaPartitionRoot"));
}

@Override