diff --git a/.github/ISSUE_TEMPLATE/config.yml b/.github/ISSUE_TEMPLATE/config.yml
index 05a81306669..74483115591 100644
--- a/.github/ISSUE_TEMPLATE/config.yml
+++ b/.github/ISSUE_TEMPLATE/config.yml
@@ -1,23 +1,3 @@
-# --------------------------------------------------------------------
-#
-# Licensed to the Apache Software Foundation (ASF) under one or more
-# contributor license agreements. See the NOTICE file distributed
-# with this work for additional information regarding copyright
-# ownership. The ASF licenses this file to You under the Apache
-# License, Version 2.0 (the "License"); you may not use this file
-# except in compliance with the License. You may obtain a copy of the
-# License at
-#
-#    http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-# implied. See the License for the specific language governing
-# permissions and limitations under the License.
-#
-# --------------------------------------------------------------------
-
 blank_issues_enabled: true
 contact_links:
   - name: 🙏🏻 Q&A
diff --git a/.github/workflows/build-cloudberry-rocky8.yml b/.github/workflows/build-cloudberry-rocky8.yml
index 2abf88060e3..4986eae11b2 100644
--- a/.github/workflows/build-cloudberry-rocky8.yml
+++ b/.github/workflows/build-cloudberry-rocky8.yml
@@ -320,6 +320,10 @@ jobs:
                                "gpcontrib/gp_sparse_vector:installcheck",
                                "gpcontrib/gp_toolkit:installcheck"]
               },
+              {"test":"gpcontrib-gp-stats-collector",
+               "make_configs":["gpcontrib/gp_stats_collector:installcheck"],
+               "extension":"gp_stats_collector"
+              },
               {"test":"ic-fixme",
                "make_configs":["src/test/regress:installcheck-fixme"],
                "enable_core_check":false
@@ -339,6 +343,10 @@ jobs:
               },
               {"test":"ic-cbdb-parallel",
                "make_configs":["src/test/regress:installcheck-cbdb-parallel"]
+              },
+              {"test":"ic-recovery",
+               "make_configs":["src/test/recovery:installcheck"],
+               "enable_core_check":false
               }
             ]
           }'
@@ -1396,6 +1404,7 @@ jobs:
         if: success() && needs.check-skip.outputs.should_skip != 'true'
         env:
           SRC_DIR: ${{ github.workspace }}
+          BUILD_DESTINATION: /usr/local/cloudberry-db
         shell: bash {0}
         run: |
           set -o pipefail
@@ -1419,6 +1428,30 @@ jobs:
           # 2. Follow the same pattern as optimizer
           # 3. Update matrix entries to include the new setting
 
+          # Create extension if required
+          if [[ "${{ matrix.extension != '' }}" == "true" ]]; then
+            case "${{ matrix.extension }}" in
+              gp_stats_collector)
+                if ! su - gpadmin -c "source ${BUILD_DESTINATION}/cloudberry-env.sh && \
+                  source ${SRC_DIR}/gpAux/gpdemo/gpdemo-env.sh && \
+                  gpconfig -c shared_preload_libraries -v 'gp_stats_collector' && \
+                  gpstop -ra && \
+                  echo 'CREATE EXTENSION IF NOT EXISTS gp_stats_collector; \
+                        SHOW shared_preload_libraries; \
+                        TABLE pg_extension;' | \
+                    psql postgres"
+                then
+                    echo "Error creating gp_stats_collector extension"
+                    exit 1
+                fi
+                ;;
+              *)
+                echo "Unknown extension: ${{ matrix.extension }}"
+                exit 1
+                ;;
+            esac
+          fi
+
           # Set PostgreSQL options if defined
           PG_OPTS=""
           if [[ "${{ matrix.pg_settings.optimizer != '' }}" == "true" ]]; then
@@ -1643,6 +1676,7 @@ jobs:
 
       - name: Check and Display Regression Diffs
         if: always()
+        shell: bash {0}
         run: |
           # Search for regression.diffs recursively
           found_file=$(find . -type f -name "regression.diffs" | head -n 1)
diff --git a/.github/workflows/build-cloudberry.yml b/.github/workflows/build-cloudberry.yml
index ca75f7b42e7..c00dcde0486 100644
--- a/.github/workflows/build-cloudberry.yml
+++ b/.github/workflows/build-cloudberry.yml
@@ -271,6 +271,10 @@ jobs:
                 },
                 "enable_core_check":false
               },
+              {"test":"gpcontrib-gp-stats-collector",
+               "make_configs":["gpcontrib/gp_stats_collector:installcheck"],
+               "extension":"gp_stats_collector"
+              },
               {"test":"ic-expandshrink",
                "make_configs":["src/test/isolation2:installcheck-expandshrink"]
               },
@@ -312,7 +316,8 @@ jobs:
                                "gpcontrib/zstd:installcheck",
                                "gpcontrib/gp_sparse_vector:installcheck",
                                "gpcontrib/gp_toolkit:installcheck",
-                               "gpcontrib/gp_exttable_fdw:installcheck"]
+                               "gpcontrib/gp_exttable_fdw:installcheck",
+                               "gpcontrib/gp_internal_tools:installcheck"]
               },
               {"test":"ic-diskquota",
                "make_configs":["gpcontrib/diskquota:installcheck"],
@@ -337,6 +342,9 @@ jobs:
               },
               {"test":"ic-cbdb-parallel",
                "make_configs":["src/test/regress:installcheck-cbdb-parallel"]
+              },
+              {"test":"ic-orca-parallel",
+               "make_configs":["src/test/regress:installcheck-orca-parallel"]
               }
             ]
           }'
@@ -1402,6 +1410,7 @@ jobs:
         if: success() && needs.check-skip.outputs.should_skip != 'true'
         env:
           SRC_DIR: ${{ github.workspace }}
+          BUILD_DESTINATION: /usr/local/cloudberry-db
         shell: bash {0}
         run: |
           set -o pipefail
@@ -1431,6 +1440,30 @@ jobs:
             PG_OPTS="$PG_OPTS -c optimizer=${{ matrix.pg_settings.optimizer }}"
           fi
 
+          # Create extension if required
+          if [[ "${{ matrix.extension != '' }}" == "true" ]]; then
+            case "${{ matrix.extension }}" in
+              gp_stats_collector)
+                if ! su - gpadmin -c "source ${BUILD_DESTINATION}/cloudberry-env.sh && \
+                  source ${SRC_DIR}/gpAux/gpdemo/gpdemo-env.sh && \
+                  gpconfig -c shared_preload_libraries -v 'gp_stats_collector' && \
+                  gpstop -ra && \
+                  echo 'CREATE EXTENSION IF NOT EXISTS gp_stats_collector; \
+                        SHOW shared_preload_libraries; \
+                        TABLE pg_extension;' | \
+                    psql postgres"
+                then
+                    echo "Error creating gp_stats_collector extension"
+                    exit 1
+                fi
+                ;;
+              *)
+                echo "Unknown extension: ${{ matrix.extension }}"
+                exit 1
+                ;;
+            esac
+          fi
+
           if [[ "${{ matrix.pg_settings.default_table_access_method != '' }}" == "true" ]]; then
             PG_OPTS="$PG_OPTS -c default_table_access_method=${{ matrix.pg_settings.default_table_access_method }}"
           fi
@@ -1649,6 +1682,7 @@ jobs:
 
       - name: Check and Display Regression Diffs
         if: always()
+        shell: bash {0}
         run: |
           # Search for regression.diffs recursively
           found_file=$(find . -type f -name "regression.diffs" | head -n 1)
diff --git a/.github/workflows/build-deb-cloudberry-ubuntu24.04.yml b/.github/workflows/build-deb-cloudberry-ubuntu24.04.yml
new file mode 100644
index 00000000000..041eabc252b
--- /dev/null
+++ b/.github/workflows/build-deb-cloudberry-ubuntu24.04.yml
@@ -0,0 +1,1892 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+# GitHub Actions Workflow: Apache Cloudberry Build Pipeline
+# --------------------------------------------------------------------
+# Description:
+#
+#   This workflow builds, tests, and packages Apache Cloudberry on
+#   Ubuntu 24.04. It ensures artifact integrity and performs installation
+#   tests.
+#
+# Workflow Overview:
+# 1. **Build Job**:
+#    - Configures and builds Apache Cloudberry.
+#    - Supports debug build configuration via ENABLE_DEBUG flag.
+#    - Runs unit tests and verifies build artifacts.
+#    - Creates DEB packages (regular and debug), source tarball
+#    and additional files for dupload utility.
+#    - **Key Artifacts**: DEB package, source tarball, changes and dsc files, build logs.
+#
+# 2. **DEB Install Test Job**:
+#    - Verifies DEB integrity and installs Cloudberry.
+#    - Validates successful installation.
+#    - **Key Artifacts**: Installation logs, verification results.
+#
+# 3. **Report Job**:
+#    - Aggregates job results into a final report.
+#    - Sends failure notifications if any step fails.
+#
+# Execution Environment:
+# - **Runs On**: ubuntu-22.04 with ubuntu-24.04 containers.
+# - **Resource Requirements**:
+#   - Disk: Minimum 20GB free space.
+#   - Memory: Minimum 8GB RAM.
+#   - CPU: Recommended 4+ cores.
+#
+# Triggers:
+# - Push to `main` or `REL_2_STABLE` branch.
+# - Pull request that modifies this workflow file.
+# - Scheduled: Every Monday at 02:00 UTC.
+# - Manual workflow dispatch.
+#
+# Container Images:
+# - **Build**: `apache/incubator-cloudberry:cbdb-build-ubuntu24.04-latest`
+# - **Test**: `apache/incubator-cloudberry:cbdb-test-ubuntu24.04-latest`
+#
+# Artifacts:
+# - DEB Package           (retention: ${{ env.LOG_RETENTION_DAYS }} days).
+# - Changes and DSC files (retention: ${{ env.LOG_RETENTION_DAYS }} days).
+# - Source Tarball        (retention: ${{ env.LOG_RETENTION_DAYS }} days).
+# - Logs and Test Results (retention: ${{ env.LOG_RETENTION_DAYS }} days).
+#
+# Notes:
+# - Supports concurrent job execution.
+# - Supports debug builds with preserved symbols.
+# --------------------------------------------------------------------
+
+name: Apache Cloudberry Debian Build
+
+on:
+  push:
+    branches: [main, REL_2_STABLE]
+  pull_request:
+    paths:
+      - '.github/workflows/build-deb-cloudberry-ubuntu24.04.yml'
+    # PRs currently trigger only when this workflow file changes; to test all PRs enable:
+    # branches: [main, REL_2_STABLE]
+    # types: [opened, synchronize, reopened, edited]
+  schedule:
+    # Run every Monday at 02:00 UTC
+    - cron: '0 2 * * 1'
+  workflow_dispatch:  # Manual trigger
+    inputs:
+      test_selection:
+        description: 'Select tests to run (comma-separated). Examples: ic-deb-good-opt-off,ic-deb-contrib'
+        required: false
+        default: 'all'
+        type: string
+      reuse_artifacts_from_run_id:
+        description: 'Reuse build artifacts from a previous run ID (leave empty to build fresh)'
+        required: false
+        default: ''
+        type: string
+
+# Note: Step details, logs, and artifacts require users to be logged into GitHub
+# even for public repositories. This is a GitHub security feature and cannot
+# be overridden by permissions.
+
+permissions:
+  # READ permission allows viewing repository contents
+  contents: read      # Required for checking out code and reading repository files
+
+  # READ permission for packages (container registry, etc.)
+  packages: read      # Allows reading from GitHub package registry
+
+  # WRITE permission for actions includes read access to:
+  # - Workflow runs
+  # - Artifacts (requires GitHub login)
+  # - Logs (requires GitHub login)
+  actions: write
+
+  # READ permission for the checks API:
+  # - Step details visibility (requires GitHub login)
+  # - Check run status and details
+  checks: read
+
+  # READ permission for pull request metadata:
+  # - PR status
+  # - Associated checks
+  # - Review states
+  pull-requests: read
+
+env:
+  LOG_RETENTION_DAYS: 7  # used as retention-days by the artifact upload steps
+  ENABLE_DEBUG: false  # forwarded to configure-cloudberry.sh and shown in the job summary
+
+jobs:
+
+  ## ======================================================================
+  ## Job: check-skip
+  ## ======================================================================
+
+  check-skip:
+    runs-on: ubuntu-22.04
+    outputs:
+      should_skip: ${{ steps.skip-check.outputs.should_skip }}
+    steps:
+      - id: skip-check
+        shell: bash
+        env:
+          EVENT_NAME: ${{ github.event_name }}
+          PR_TITLE: ${{ github.event.pull_request.title || '' }}
+          PR_BODY: ${{ github.event.pull_request.body || '' }}
+        run: |
+          # Default to not skipping
+          echo "should_skip=false" >> "$GITHUB_OUTPUT"
+
+          # Apply skip logic only for pull_request events
+          if [[ "$EVENT_NAME" == "pull_request" ]]; then
+            # Combine PR title and body, one per line, for the skip check
+            MESSAGE="${PR_TITLE}"$'\n'"${PR_BODY}"
+
+            # PR text is untrusted: print it with printf '%s' so backslash
+            # sequences (e.g. \c) are not interpreted the way `echo -e` would
+            echo "Checking PR title and body:"
+            printf '%s\n' "$MESSAGE"
+
+            # Check for skip patterns (here-string: no pipe, so no SIGPIPE under pipefail)
+            if grep -qEi '\[skip[ -]ci\]|\[ci[ -]skip\]|\[no[ -]ci\]' <<< "$MESSAGE"; then
+              echo "should_skip=true" >> "$GITHUB_OUTPUT"
+            fi
+          else
+            echo "Skip logic is not applied for $EVENT_NAME events."
+          fi
+
+      - name: Report Skip Status
+        if: steps.skip-check.outputs.should_skip == 'true'
+        run: |
+          echo "CI Skip flag detected in PR - skipping all checks."
+          exit 0
+
+  ## ======================================================================
+  ## Job: prepare-test-matrix-deb
+  ## ======================================================================
+
+  prepare-test-matrix-deb:
+    runs-on: ubuntu-22.04
+    needs: [check-skip]
+    if: needs.check-skip.outputs.should_skip != 'true'
+    outputs:
+      test-matrix: ${{ steps.set-matrix.outputs.matrix }}
+
+    steps:
+      - id: set-matrix
+        env:
+          TEST_SELECTION: ${{ github.event.inputs.test_selection }}
+        run: |
+          echo "=== Matrix Preparation Diagnostics ==="
+          echo "Event type: ${{ github.event_name }}"
+          echo "Test selection input: '${TEST_SELECTION}'"
+
+          # Define defaults
+          DEFAULT_NUM_PRIMARY_MIRROR_PAIRS=3
+          DEFAULT_ENABLE_CGROUPS=false
+          DEFAULT_ENABLE_CORE_CHECK=true
+          DEFAULT_PG_SETTINGS_OPTIMIZER=""
+
+          # Define base test configurations
+          ALL_TESTS='{
+            "include": [
+              {"test":"ic-deb-good-opt-off",
+               "make_configs":["src/test/regress:installcheck-good"],
+               "pg_settings":{"optimizer":"off"}
+              },
+              {"test":"ic-deb-good-opt-on",
+               "make_configs":["src/test/regress:installcheck-good"],
+               "pg_settings":{"optimizer":"on"}
+              },
+              {"test":"pax-ic-deb-good-opt-off",
+               "make_configs":[
+                "contrib/pax_storage/:pax-test",
+                "contrib/pax_storage/:regress_test"
+              ],
+               "pg_settings":{
+                 "optimizer":"off",
+                 "default_table_access_method":"pax"
+                }
+              },
+              {"test":"pax-ic-deb-good-opt-on",
+               "make_configs":[
+                "contrib/pax_storage/:pax-test",
+                "contrib/pax_storage/:regress_test"
+              ],
+               "pg_settings":{
+                 "optimizer":"on",
+                 "default_table_access_method":"pax"
+                }
+              },
+              {"test":"ic-deb-contrib",
+               "make_configs":["contrib/auto_explain:installcheck",
+                               "contrib/amcheck:installcheck",
+                               "contrib/citext:installcheck",
+                               "contrib/btree_gin:installcheck",
+                               "contrib/btree_gist:installcheck",
+                               "contrib/dblink:installcheck",
+                               "contrib/dict_int:installcheck",
+                               "contrib/dict_xsyn:installcheck",
+                               "contrib/extprotocol:installcheck",
+                               "contrib/file_fdw:installcheck",
+                               "contrib/formatter_fixedwidth:installcheck",
+                               "contrib/hstore:installcheck",
+                               "contrib/indexscan:installcheck",
+                               "contrib/pg_trgm:installcheck",
+                               "contrib/pgcrypto:installcheck",
+                               "contrib/pgstattuple:installcheck",
+                               "contrib/tablefunc:installcheck",
+                               "contrib/passwordcheck:installcheck",
+                               "contrib/pg_buffercache:installcheck",
+                               "contrib/sslinfo:installcheck"]
+              },
+              {"test":"ic-deb-gpcontrib",
+               "make_configs":["gpcontrib/orafce:installcheck",
+                               "gpcontrib/zstd:installcheck",
+                               "gpcontrib/gp_sparse_vector:installcheck",
+                               "gpcontrib/gp_toolkit:installcheck"]
+              },
+              {"test":"gpcontrib-gp-stats-collector",
+               "make_configs":["gpcontrib/gp_stats_collector:installcheck"],
+               "extension":"gp_stats_collector"
+              },
+              {"test":"ic-cbdb-parallel",
+               "make_configs":["src/test/regress:installcheck-cbdb-parallel"]
+              }
+            ]
+          }'
+
+          # Merge one test config over the defaults (jq `*` merges recursively; test values win)
+          apply_defaults() {
+            echo "$1" | jq --arg     npm "$DEFAULT_NUM_PRIMARY_MIRROR_PAIRS" \
+                           --argjson ec  "$DEFAULT_ENABLE_CGROUPS" \
+                           --argjson ecc "$DEFAULT_ENABLE_CORE_CHECK" \
+                           --arg     opt "$DEFAULT_PG_SETTINGS_OPTIMIZER" \
+              'def get_defaults:
+                {
+                  num_primary_mirror_pairs: ($npm|tonumber),
+                  enable_cgroups: $ec,
+                  enable_core_check: $ecc,
+                  pg_settings: {
+                    optimizer: $opt
+                  }
+                };
+               get_defaults * .'
+          }
+
+          # Extract all valid test names from ALL_TESTS
+          VALID_TESTS=$(echo "$ALL_TESTS" | jq -r '.include[].test')
+
+          # Parse input test selection (taken from the environment, never interpolated into the script)
+          IFS=',' read -ra SELECTED_TESTS <<< "$TEST_SELECTION"
+
+          # Default to all tests if selection is empty or 'all'
+          if [[ "${SELECTED_TESTS[*]}" == "all" || -z "${SELECTED_TESTS[*]}" ]]; then
+            mapfile -t SELECTED_TESTS <<< "$VALID_TESTS"
+          fi
+
+          # Validate selected tests: a name must equal a full line of VALID_TESTS (-x), literally (-F)
+          INVALID_TESTS=()
+          FILTERED_TESTS=()
+          for TEST in "${SELECTED_TESTS[@]}"; do
+            TEST=$(echo "$TEST" | tr -d '[:space:]') # Trim whitespace
+            if echo "$VALID_TESTS" | grep -qxF -- "$TEST"; then
+              FILTERED_TESTS+=("$TEST")
+            else
+              INVALID_TESTS+=("$TEST")
+            fi
+          done
+
+          # Handle invalid tests
+          if [[ ${#INVALID_TESTS[@]} -gt 0 ]]; then
+            echo "::error::Invalid test(s) selected: ${INVALID_TESTS[*]}"
+            echo "Valid tests are: $(echo "$VALID_TESTS" | tr '\n' ', ')"
+            exit 1
+          fi
+
+          # Build result JSON with defaults applied
+          RESULT='{"include":['
+          FIRST=true
+          for TEST in "${FILTERED_TESTS[@]}"; do
+            CONFIG=$(jq -c --arg test "$TEST" '.include[] | select(.test == $test)' <<< "$ALL_TESTS")
+            FILTERED_WITH_DEFAULTS=$(apply_defaults "$CONFIG")
+            if [[ "$FIRST" == true ]]; then
+              FIRST=false
+            else
+              RESULT="${RESULT},"
+            fi
+            RESULT="${RESULT}${FILTERED_WITH_DEFAULTS}"
+          done
+          RESULT="${RESULT}]}"
+
+          # Log the matrix, then publish it as the multi-line `matrix` step output
+          echo "Final matrix configuration:"
+          echo "$RESULT" | jq .
+
+          {
+            echo "matrix<<EOF"
+            echo "$RESULT"
+            echo "EOF"
+          } >> "$GITHUB_OUTPUT"
+
+          echo "=== Matrix Preparation Complete ==="
+
+  ## ======================================================================
+  ## Job: build-deb
+  ## ======================================================================
+
+  build-deb:
+    name: Build Apache Cloudberry DEB (Ubuntu 24.04)
+    env:
+      JOB_TYPE: build
+    needs: [check-skip]
+    runs-on: ubuntu-22.04
+    timeout-minutes: 120
+    if: needs.check-skip.outputs.should_skip != 'true' && github.event.inputs.reuse_artifacts_from_run_id == ''
+    outputs:
+      build_timestamp: ${{ steps.set_timestamp.outputs.timestamp }}
+
+    container:
+      image: apache/incubator-cloudberry:cbdb-build-ubuntu24.04-latest
+      options: >-  # root user, hostname cdw, host dirs bind-mounted under /host_* for cleanup
+        --user root
+        -h cdw
+        -v /usr/share:/host_usr_share
+        -v /usr/local:/host_usr_local
+        -v /opt:/host_opt
+
+    steps:
+      - name: Free Disk Space
+        if: needs.check-skip.outputs.should_skip != 'true'
+        run: |
+          echo "=== Disk space before cleanup ==="
+          df -h /
+
+          # Best-effort removal of pre-installed host tools via the /host_* bind mounts
+          rm -rf /host_opt/hostedtoolcache || true   # GitHub Actions tool cache
+          rm -rf /host_usr_local/lib/android || true # Android SDK
+          rm -rf /host_usr_share/dotnet || true      # .NET SDK
+          rm -rf /host_opt/ghc || true               # Haskell GHC
+          rm -rf /host_usr_local/.ghcup || true      # Haskell GHCup
+          rm -rf /host_usr_share/swift || true       # Swift
+          rm -rf /host_usr_local/share/powershell || true  # PowerShell
+          rm -rf /host_usr_local/share/chromium || true    # Chromium
+          rm -rf /host_usr_share/miniconda || true   # Miniconda
+          rm -rf /host_opt/az || true                # Azure CLI
+          rm -rf /host_usr_share/sbt || true         # Scala Build Tool
+
+          echo "=== Disk space after cleanup ==="
+          df -h /
+
+      - name: Skip Check
+        if: needs.check-skip.outputs.should_skip == 'true'
+        run: |
+          echo "Build skipped via CI skip flag" >> "$GITHUB_STEP_SUMMARY"
+          exit 0  # ends this step only; later steps without their own `if:` still run
+
+      - name: Set build timestamp
+        id: set_timestamp  # Referenced by the job-level build_timestamp output
+        run: |
+          timestamp=$(date +'%Y%m%d_%H%M%S')
+          echo "timestamp=$timestamp" | tee -a "$GITHUB_OUTPUT"  # Step output (also echoed to the log by tee)
+          echo "BUILD_TIMESTAMP=$timestamp" | tee -a "$GITHUB_ENV" # Environment variable for later steps
+
+      - name: Checkout Apache Cloudberry
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 1  # shallow clone: only the most recent commit
+          submodules: true  # also check out git submodules
+
+      - name: Cloudberry Environment Initialization
+        shell: bash
+        env:
+          LOGS_DIR: build-logs
+        run: |
+          set -eo pipefail
+          if ! su - gpadmin -c "/tmp/init_system.sh"; then  # script is expected to exist in the image
+            echo "::error::Container initialization failed"
+            exit 1
+          fi
+
+          mkdir -p "${LOGS_DIR}/details"
+          chown -R gpadmin:gpadmin .  # later steps run the build scripts as gpadmin
+          chmod -R 755 .
+          chmod 777 "${LOGS_DIR}"  # world-writable so any user can write logs
+
+          df -kh /
+          rm -rf /__t/*  # presumably the runner tool-cache mount; frees space — TODO confirm
+          df -kh /
+
+          df -h | tee -a "${LOGS_DIR}/details/disk-usage.log"
+          free -h | tee -a "${LOGS_DIR}/details/memory-usage.log"
+
+          {
+            echo "=== Environment Information ==="
+            uname -a
+            df -h
+            free -h
+            env  # NOTE(review): full environment lands in an uploaded log — confirm no secrets leak
+          } | tee -a "${LOGS_DIR}/details/environment.log"
+
+          echo "SRC_DIR=${GITHUB_WORKSPACE}" | tee -a "$GITHUB_ENV"  # SRC_DIR for steps without their own env
+
+      - name: Generate Build Job Summary Start
+        run: |
+          {  # everything echoed in this group is appended to the job summary
+            echo "# Build Job Summary (Ubuntu 24.04)"
+            echo "## Environment"
+            echo "- Start Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+            echo "- ENABLE_DEBUG: ${{ env.ENABLE_DEBUG }}"
+            echo "- OS Version: $(lsb_release -sd)"
+            echo "- GCC Version: $(gcc --version | head -n1)"
+          } >> "$GITHUB_STEP_SUMMARY"
+
+      - name: Run Apache Cloudberry configure script
+        shell: bash
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          export BUILD_DESTINATION=${SRC_DIR}/debian/build  # passed explicitly below; `su -` starts a fresh login environment
+
+          chmod +x "${SRC_DIR}"/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh
+          if ! time su - gpadmin -c "cd ${SRC_DIR} && SRC_DIR=${SRC_DIR} ENABLE_DEBUG=${{ env.ENABLE_DEBUG }} BUILD_DESTINATION=${BUILD_DESTINATION} ${SRC_DIR}/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh"; then
+            echo "::error::Configure script failed"
+            exit 1
+          fi
+
+      - name: Run Apache Cloudberry build script
+        shell: bash
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          export BUILD_DESTINATION=${SRC_DIR}/debian/build  # same destination as the configure step
+
+          chmod +x "${SRC_DIR}"/devops/build/automation/cloudberry/scripts/build-cloudberry.sh
+          if ! time su - gpadmin -c "cd ${SRC_DIR} && SRC_DIR=${SRC_DIR} BUILD_DESTINATION=${BUILD_DESTINATION} ${SRC_DIR}/devops/build/automation/cloudberry/scripts/build-cloudberry.sh"; then
+            echo "::error::Build script failed"
+            exit 1
+          fi
+
+      - name: Verify build artifacts
+        shell: bash
+        run: |
+          set -eo pipefail
+
+          export BUILD_DESTINATION=${SRC_DIR}/debian/build  # SRC_DIR comes from GITHUB_ENV (set during initialization)
+
+          echo "Verifying build artifacts..."
+          {
+            echo "=== Build Artifacts Verification ==="
+            echo "Timestamp: $(date -u)"
+
+            if [ ! -d "${BUILD_DESTINATION}" ]; then
+              echo "::error::Build artifacts directory not found"
+              exit 1
+            fi
+
+            # Binaries that must exist and be executable
+            critical_binaries=(
+              "${BUILD_DESTINATION}/bin/postgres"
+              "${BUILD_DESTINATION}/bin/psql"
+            )
+
+            echo "Checking critical binaries..."
+            for binary in "${critical_binaries[@]}"; do
+              if [ ! -f "$binary" ]; then
+                echo "::error::Critical binary missing: $binary"
+                exit 1
+              fi
+              if [ ! -x "$binary" ]; then
+                echo "::error::Binary not executable: $binary"
+                exit 1
+              fi
+              echo "Binary verified: $binary"
+              ls -l "$binary"
+            done
+
+            # Smoke test: each binary must start and report its version
+            echo "Testing binary execution..."
+            if ! ${BUILD_DESTINATION}/bin/postgres --version; then
+              echo "::error::postgres binary verification failed"
+              exit 1
+            fi
+            if ! ${BUILD_DESTINATION}/bin/psql --version; then
+              echo "::error::psql binary verification failed"
+              exit 1
+            fi
+
+            echo "All build artifacts verified successfully"
+          } 2>&1 | tee -a build-logs/details/build-verification.log  # pipefail propagates an `exit 1` from the group
+
+      - name: Create Source tarball, create DEB and verify artifacts
+        shell: bash
+        env:
+          CBDB_VERSION: 99.0.0
+          BUILD_NUMBER: 1
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          {
+            echo "=== Artifact Creation Log ==="
+            echo "Timestamp: $(date -u)"
+
+            cp -r "${SRC_DIR}"/devops/build/packaging/deb/ubuntu24.04/* debian/
+            chown -R "$(whoami)" debian
+            chmod -x debian/*install
+
+            # Replace characters not supported in the version: '/' -> '.', '_' -> '-'
+            CBDB_VERSION=$(echo "$CBDB_VERSION" | sed "s/\//./g")
+            CBDB_VERSION=$(echo "$CBDB_VERSION" | sed "s/_/-/g")
+
+            echo "We will build ${CBDB_VERSION}"
+            export BUILD_DESTINATION=${SRC_DIR}/debian/build
+
+            if ! "${SRC_DIR}"/devops/build/packaging/deb/build-deb.sh -v "${CBDB_VERSION}"; then
+              echo "::error::Build script failed"
+              exit 1
+            fi
+
+            ARCH=$(dpkg --print-architecture)
+            # Detect OS distribution (e.g., ubuntu24.04, debian12)
+            if [ -f /etc/os-release ]; then
+              . /etc/os-release
+              OS_DISTRO=$(echo "${ID}${VERSION_ID}" | tr '[:upper:]' '[:lower:]')
+            else
+              OS_DISTRO="unknown"
+            fi
+            CBDB_PKG_VERSION=${CBDB_VERSION}-${BUILD_NUMBER}-${OS_DISTRO}
+
+            echo "Produced artifacts"
+            ls -l ../
+
+            echo "Copy artifacts to subdirectory for sign/upload"
+            mkdir -p "${SRC_DIR}/deb"
+            DEB_FILE="apache-cloudberry-db-incubating_${CBDB_PKG_VERSION}"_"${ARCH}".deb
+            DBG_DEB_FILE="apache-cloudberry-db-incubating-dbgsym_${CBDB_PKG_VERSION}"_"${ARCH}".ddeb
+            CHANGES_DEB_FILE="apache-cloudberry-db-incubating_${CBDB_PKG_VERSION}"_"${ARCH}".changes
+            BUILDINFO_DEB_FILE="apache-cloudberry-db-incubating_${CBDB_PKG_VERSION}"_"${ARCH}".buildinfo
+            DSC_DEB_FILE="apache-cloudberry-db-incubating_${CBDB_PKG_VERSION}".dsc
+            SOURCE_FILE="apache-cloudberry-db-incubating_${CBDB_PKG_VERSION}".tar.xz
+            cp ../"${DEB_FILE}" "${SRC_DIR}/deb"
+            cp ../"${DBG_DEB_FILE}" "${SRC_DIR}/deb"
+            cp ../"${CHANGES_DEB_FILE}" "${SRC_DIR}/deb"
+            cp ../"${BUILDINFO_DEB_FILE}" "${SRC_DIR}/deb"
+            cp ../"${DSC_DEB_FILE}" "${SRC_DIR}/deb"
+            cp ../"${SOURCE_FILE}" "${SRC_DIR}/deb"
+            mkdir "${SRC_DIR}/deb/debian"
+            cp debian/changelog "${SRC_DIR}/deb/debian"
+
+            # Get package information
+            echo "Package Information:"
+            dpkg --info "${SRC_DIR}/deb/${DEB_FILE}"
+            dpkg --contents "${SRC_DIR}/deb/${DEB_FILE}"
+
+            # Verify critical files in DEB (grep -c reads all input and fails when the count is 0)
+            echo "Verifying critical files in DEB..."
+            for binary in "bin/postgres" "bin/psql"; do
+              if ! dpkg --contents "${SRC_DIR}/deb/${DEB_FILE}" | grep -c "${binary}$"; then
+                echo "::error::Critical binary '${binary}' not found in DEB"
+                exit 1
+              fi
+            done
+
+            # Record checksums
+            echo "Calculating checksums..."
+            sha256sum "${SRC_DIR}/deb/${DEB_FILE}" | tee -a build-logs/details/checksums.log
+
+            echo "Artifacts created and verified successfully"
+
+
+          } 2>&1 | tee -a build-logs/details/artifact-creation.log
+
+      - name: Run Apache Cloudberry unittest script
+        if: needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          # Make the unit-test driver executable, then run it as gpadmin in a
+          # login shell from the source tree; any failure fails the step.
+          UNITTEST_SCRIPT="${SRC_DIR}/devops/build/automation/cloudberry/scripts/unittest-cloudberry.sh"
+          chmod +x "${UNITTEST_SCRIPT}"
+          time su - gpadmin -c "cd ${SRC_DIR} && SRC_DIR=${SRC_DIR} ${UNITTEST_SCRIPT}" || {
+            echo "::error::Unittest script failed"
+            exit 1
+          }
+
+      - name: Generate Build Job Summary End
+        run: |
+          # Append the closing section, stamped with the UTC end time, to the
+          # job summary.
+          echo "## Build Results" >> "$GITHUB_STEP_SUMMARY"
+          echo "- End Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')" >> "$GITHUB_STEP_SUMMARY"
+
+      - name: Upload build logs
+        uses: actions/upload-artifact@v4
+        with:
+          # The artifact name embeds env.BUILD_TIMESTAMP.
+          name: build-logs-ubuntu24.04-${{ env.BUILD_TIMESTAMP }}
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}
+          path: |
+            build-logs/
+
+      - name: Upload Cloudberry DEB build artifacts
+        uses: actions/upload-artifact@v4
+        with:
+          name: apache-cloudberry-db-incubating-deb-ubuntu24.04-build-artifacts
+          # Binary package plus its debug-symbol package; the step errors out
+          # when neither pattern matches a file.
+          path: |
+            deb/*.deb
+            deb/*.ddeb
+          if-no-files-found: error
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}
+
+      - name: Upload Cloudberry deb source build artifacts
+        uses: actions/upload-artifact@v4
+        with:
+          name: apache-cloudberry-db-incubating-deb-source-build-artifacts
+          # Source tarball and the packaging metadata copied next to it
+          # (.changes, .dsc, .buildinfo, debian/changelog).
+          path: |
+            deb/*.tar.xz
+            deb/*.changes
+            deb/*.dsc
+            deb/*.buildinfo
+            deb/debian/changelog
+          if-no-files-found: error
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}
+
+  ## ======================================================================
+  ## Job: deb-install-test
+  ## ======================================================================
+
+  deb-install-test:
+    name: DEB Install Test Apache Cloudberry (Ubuntu 24.04)
+    needs:
+      - check-skip
+      - build-deb
+    # Run unless the workflow was cancelled, only once build-deb has succeeded
+    # or been skipped, and only when no run id was supplied for artifact reuse.
+    if: |
+      !cancelled() &&
+      (needs.build-deb.result == 'success' || needs.build-deb.result == 'skipped') &&
+      github.event.inputs.reuse_artifacts_from_run_id == ''
+    runs-on: ubuntu-22.04
+    timeout-minutes: 120
+
+    container:
+      image: apache/incubator-cloudberry:cbdb-test-ubuntu24.04-latest
+      # Run as root with hostname "cdw"; the host's /usr/share, /usr/local and
+      # /opt are bind-mounted under /host_* inside the container.
+      options: >-
+        --user root
+        -h cdw
+        -v /usr/share:/host_usr_share
+        -v /usr/local:/host_usr_local
+        -v /opt:/host_opt
+    steps:
+      - name: Free Disk Space
+        if: needs.check-skip.outputs.should_skip != 'true'
+        run: |
+          echo "=== Disk space before cleanup ==="
+          df -h /
+
+          # Remove pre-installed tools from the bind-mounted host directories to
+          # free disk space. In order: GitHub Actions tool cache, Android SDK,
+          # .NET SDK, Haskell GHC, Haskell GHCup, Swift, PowerShell, Chromium,
+          # Miniconda, Azure CLI, Scala Build Tool.
+          for host_path in \
+            /host_opt/hostedtoolcache \
+            /host_usr_local/lib/android \
+            /host_usr_share/dotnet \
+            /host_opt/ghc \
+            /host_usr_local/.ghcup \
+            /host_usr_share/swift \
+            /host_usr_local/share/powershell \
+            /host_usr_local/share/chromium \
+            /host_usr_share/miniconda \
+            /host_opt/az \
+            /host_usr_share/sbt
+          do
+            rm -rf "${host_path}" || true
+          done
+
+          echo "=== Disk space after cleanup ==="
+          df -h /
+
+      - name: Skip Check
+        if: needs.check-skip.outputs.should_skip == 'true'
+        run: |
+          # Record the skip in the job summary and end the step successfully.
+          skip_note="DEB install test skipped via CI skip flag"
+          echo "${skip_note}" >> "$GITHUB_STEP_SUMMARY"
+          exit 0
+
+      - name: Download Cloudberry DEB build artifacts
+        if: needs.check-skip.outputs.should_skip != 'true'
+        uses: actions/download-artifact@v4
+        with:
+          name: apache-cloudberry-db-incubating-deb-ubuntu24.04-build-artifacts
+          # This job only runs when reuse_artifacts_from_run_id is empty, so the
+          # expression below resolves to the current run id.
+          run-id: ${{ github.event.inputs.reuse_artifacts_from_run_id || github.run_id }}
+          merge-multiple: false
+          path: ${{ github.workspace }}/deb_build_artifacts
+
+      - name: Cloudberry Environment Initialization
+        if: needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          LOGS_DIR: install-logs
+        run: |
+          set -eo pipefail
+
+          # Bootstrap the container as gpadmin (login shell).
+          su - gpadmin -c "/tmp/init_system.sh" || {
+            echo "::error::Container initialization failed"
+            exit 1
+          }
+
+          # Create the log tree and hand the workspace over to gpadmin.
+          DETAILS_DIR="${LOGS_DIR}/details"
+          mkdir -p "${DETAILS_DIR}"
+          chown -R gpadmin:gpadmin .
+          chmod -R 755 .
+          chmod 777 "${LOGS_DIR}"
+
+          # Empty /__t and show root filesystem usage before and after.
+          df -kh /
+          rm -rf /__t/*
+          df -kh /
+
+          df -h | tee -a "${DETAILS_DIR}/disk-usage.log"
+          free -h | tee -a "${DETAILS_DIR}/memory-usage.log"
+
+          {
+            echo "=== Environment Information ==="
+            uname -a
+            df -h
+            free -h
+            env
+          } | tee -a "${DETAILS_DIR}/environment.log"
+
+          # Publish SRC_DIR to the following steps (and echo it to the log).
+          echo "SRC_DIR=${GITHUB_WORKSPACE}" | tee -a "$GITHUB_ENV"
+
+      - name: Verify DEB artifacts
+        # Guarded like the download step: when CI is skipped nothing is
+        # downloaded, and the `ls` below would fail the job.
+        if: needs.check-skip.outputs.should_skip != 'true'
+        id: verify-artifacts
+        shell: bash
+        run: |
+          set -eo pipefail
+
+          # Locate the downloaded .deb; anything other than exactly one regular
+          # file (no match, or several matches) is treated as "not found".
+          DEB_FILE=$(ls "${GITHUB_WORKSPACE}"/deb_build_artifacts/*.deb)
+          if [ ! -f "${DEB_FILE}" ]; then
+            echo "::error::DEB file not found"
+            exit 1
+          fi
+
+          # Step output consumed by the install step.
+          echo "deb_file=${DEB_FILE}" >> "$GITHUB_OUTPUT"
+
+          echo "Verifying DEB artifacts..."
+          {
+            echo "=== DEB Verification Summary ==="
+            echo "Timestamp: $(date -u)"
+            echo "DEB File: ${DEB_FILE}"
+
+            # Get DEB metadata and verify contents
+            echo "Package Information:"
+            dpkg-deb -f "${DEB_FILE}"
+
+            # Get key DEB attributes for verification: the 1st and 3rd
+            # dash-separated fields of the package Version string.
+            DEB_VERSION=$(dpkg-deb -f "${DEB_FILE}" Version | cut -d'-' -f 1)
+            DEB_RELEASE=$(dpkg-deb -f "${DEB_FILE}" Version | cut -d'-' -f 3)
+            echo "version=${DEB_VERSION}" >> "$GITHUB_OUTPUT"
+            echo "release=${DEB_RELEASE}" >> "$GITHUB_OUTPUT"
+
+            # Verify expected binaries are in the DEB
+            echo "Verifying critical files in DEB..."
+            for binary in "bin/postgres" "bin/psql"; do
+              if ! dpkg-deb -c "${DEB_FILE}" | grep "${binary}" > /dev/null; then
+                echo "::error::Critical binary '${binary}' not found in DEB"
+                exit 1
+              fi
+            done
+
+            echo "DEB Details:"
+            echo "- Version: ${DEB_VERSION}"
+            echo "- Release: ${DEB_RELEASE}"
+
+            # Calculate and store checksum
+            echo "Checksum:"
+            sha256sum "${DEB_FILE}"
+
+          } 2>&1 | tee -a install-logs/details/deb-verification.log
+
+      - name: Install Cloudberry DEB
+        # Only install after a successful verification, and never on a
+        # skipped run (there is no package to install in that case).
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          DEB_FILE: ${{ steps.verify-artifacts.outputs.deb_file }}
+          DEB_VERSION: ${{ steps.verify-artifacts.outputs.version }}
+          DEB_RELEASE: ${{ steps.verify-artifacts.outputs.release }}
+        run: |
+          set -eo pipefail
+
+          # The package path comes from the verify-artifacts step outputs.
+          if [ -z "${DEB_FILE}" ]; then
+            echo "::error::DEB_FILE environment variable is not set"
+            exit 1
+          fi
+
+          {
+            echo "=== DEB Installation Log ==="
+            echo "Timestamp: $(date -u)"
+            echo "DEB File: ${DEB_FILE}"
+            echo "Version: ${DEB_VERSION}"
+            echo "Release: ${DEB_RELEASE}"
+
+            # Clean install location
+            rm -rf /usr/local/cloudberry-db
+
+            # Install DEB
+            echo "Starting installation..."
+            apt-get update
+            if ! apt-get -y install "${DEB_FILE}"; then
+              echo "::error::DEB installation failed"
+              exit 1
+            fi
+
+            # Change ownership back to gpadmin - it is needed for future tests
+            chown -R gpadmin:gpadmin /usr/local/cloudberry-db
+
+            # Log the installed package status and its file list.
+            echo "Installation completed successfully"
+            dpkg-query -s apache-cloudberry-db-incubating
+            echo "Installed files:"
+            dpkg-query -L apache-cloudberry-db-incubating
+          } 2>&1 | tee -a install-logs/details/deb-installation.log
+
+      - name: Upload install logs
+        uses: actions/upload-artifact@v4
+        with:
+          # This job defines no matrix, so the artifact name uses a fixed
+          # platform tag plus the build-deb timestamp.
+          name: install-logs-ubuntu24.04-${{ needs.build-deb.outputs.build_timestamp }}
+          path: |
+            install-logs/
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}
+
+      - name: Generate Install Test Job Summary End
+        if: always()
+        shell: bash {0}
+        run: |
+          # Best effort: append the installed package status, fenced as a code
+          # block, to the job summary. The trailing `|| true` keeps this step
+          # from failing.
+          SUMMARY_FILE="$GITHUB_STEP_SUMMARY"
+          {
+            echo "# Installed Package Summary (Ubuntu 24.04)"
+            echo "\`\`\`"
+
+            dpkg-query -s apache-cloudberry-db-incubating
+            echo "\`\`\`"
+          } >> "${SUMMARY_FILE}" || true
+
+  ## ======================================================================
+  ## Job: test-deb
+  ## ======================================================================
+
+  test-deb:
+    name: ${{ matrix.test }} (Ubuntu 24.04)
+    needs:
+      - check-skip
+      - build-deb
+      - prepare-test-matrix-deb
+    # Run unless cancelled, once build-deb has succeeded or been skipped.
+    if: |
+      !cancelled() &&
+      (needs.build-deb.result == 'success' || needs.build-deb.result == 'skipped')
+    runs-on: ubuntu-22.04
+    timeout-minutes: 120
+    # actionlint-allow matrix[*].pg_settings
+    strategy:
+      fail-fast: false  # Continue with other tests if one fails
+      # The matrix is the JSON emitted by the prepare-test-matrix-deb job.
+      matrix: ${{ fromJson(needs.prepare-test-matrix-deb.outputs.test-matrix) }}
+
+    container:
+      image: apache/incubator-cloudberry:cbdb-build-ubuntu24.04-latest
+      # Privileged root container with hostname "cdw", 2 GB of shared memory,
+      # unlimited core size, the host cgroup namespace with /sys/fs/cgroup
+      # mounted read-write, and host directories bind-mounted under /host_*.
+      options: >-
+        --privileged
+        --user root
+        --hostname cdw
+        --shm-size=2gb
+        --ulimit core=-1
+        --cgroupns=host
+        -v /sys/fs/cgroup:/sys/fs/cgroup:rw
+        -v /usr/share:/host_usr_share
+        -v /usr/local:/host_usr_local
+        -v /opt:/host_opt
+    steps:
+      - name: Free Disk Space
+        if: needs.check-skip.outputs.should_skip != 'true'
+        run: |
+          echo "=== Disk space before cleanup ==="
+          df -h /
+
+          # Remove pre-installed tools from the bind-mounted host directories to
+          # free disk space. In order: GitHub Actions tool cache, Android SDK,
+          # .NET SDK, Haskell GHC, Haskell GHCup, Swift, PowerShell, Chromium,
+          # Miniconda, Azure CLI, Scala Build Tool.
+          for host_path in \
+            /host_opt/hostedtoolcache \
+            /host_usr_local/lib/android \
+            /host_usr_share/dotnet \
+            /host_opt/ghc \
+            /host_usr_local/.ghcup \
+            /host_usr_share/swift \
+            /host_usr_local/share/powershell \
+            /host_usr_local/share/chromium \
+            /host_usr_share/miniconda \
+            /host_opt/az \
+            /host_usr_share/sbt
+          do
+            rm -rf "${host_path}" || true
+          done
+
+          echo "=== Disk space after cleanup ==="
+          df -h /
+
+      - name: Skip Check
+        if: needs.check-skip.outputs.should_skip == 'true'
+        run: |
+          # Note the skipped test in the job summary and end the step successfully.
+          skip_note="Test ${{ matrix.test }} skipped via CI skip flag"
+          echo "${skip_note}" >> "$GITHUB_STEP_SUMMARY"
+          exit 0
+
+      - name: Use timestamp from previous job
+        if: needs.check-skip.outputs.should_skip != 'true'
+        env:
+          PREV_BUILD_TIMESTAMP: ${{ needs.build-deb.outputs.build_timestamp }}
+        run: |
+          # Echo the build_timestamp output published by the build-deb job.
+          echo "Timestamp from output: ${PREV_BUILD_TIMESTAMP}"
+
+      - name: Cloudberry Environment Initialization
+        # Skipped together with the rest of the job when CI is skipped, in line
+        # with the same step in the deb-install-test job.
+        if: needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          LOGS_DIR: build-logs
+        run: |
+          set -eo pipefail
+          # Bootstrap the container as gpadmin (login shell).
+          if ! su - gpadmin -c "/tmp/init_system.sh"; then
+            echo "::error::Container initialization failed"
+            exit 1
+          fi
+
+          # Create the log tree and hand the workspace over to gpadmin.
+          mkdir -p "${LOGS_DIR}/details"
+          chown -R gpadmin:gpadmin .
+          chmod -R 755 .
+          chmod 777 "${LOGS_DIR}"
+
+          # Empty /__t and show root filesystem usage before and after.
+          df -kh /
+          rm -rf /__t/*
+          df -kh /
+
+          df -h | tee -a "${LOGS_DIR}/details/disk-usage.log"
+          free -h | tee -a "${LOGS_DIR}/details/memory-usage.log"
+
+          {
+            echo "=== Environment Information ==="
+            uname -a
+            df -h
+            free -h
+            env
+          } | tee -a "${LOGS_DIR}/details/environment.log"
+
+          # Publish SRC_DIR to the following steps (and echo it to the log).
+          echo "SRC_DIR=${GITHUB_WORKSPACE}" | tee -a "$GITHUB_ENV"
+
+      - name: Setup cgroups
+        if: needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        run: |
+          # No `-e`: the setup below is best effort and most writes carry
+          # `|| true`. `-u` catches unset variables, `-x` traces commands.
+          set -uxo pipefail
+
+          if [ "${{ matrix.enable_cgroups }}" = "true" ]; then
+
+            echo "Current mounts:"
+            mount | grep cgroup
+
+            CGROUP_BASEDIR=/sys/fs/cgroup
+
+            # NOTE: CGROUP_BASEDIR is a plain (unexported) shell variable, so
+            # inside the `bash -c "..."` scripts below it is written unescaped
+            # and expanded by THIS shell. Variables that belong to the child
+            # shell (\$TEST_DIR, \$\$, \$pid) stay escaped.
+
+            # 1. Basic setup with permissions
+            sudo chmod -R 777 ${CGROUP_BASEDIR}/
+            sudo mkdir -p ${CGROUP_BASEDIR}/gpdb
+            sudo chmod -R 777 ${CGROUP_BASEDIR}/gpdb
+            sudo chown -R gpadmin:gpadmin ${CGROUP_BASEDIR}/gpdb
+
+            # 2. Enable controllers
+            sudo bash -c "echo '+cpu +cpuset +memory +io' > ${CGROUP_BASEDIR}/cgroup.subtree_control" || true
+            sudo bash -c "echo '+cpu +cpuset +memory +io' > ${CGROUP_BASEDIR}/gpdb/cgroup.subtree_control" || true
+
+            # 3. CPU settings
+            sudo bash -c "echo 'max 100000' > ${CGROUP_BASEDIR}/gpdb/cpu.max" || true
+            sudo bash -c "echo '100' > ${CGROUP_BASEDIR}/gpdb/cpu.weight" || true
+            sudo bash -c "echo '0' > ${CGROUP_BASEDIR}/gpdb/cpu.weight.nice" || true
+            sudo bash -c "echo 0-$(( $(nproc) - 1 )) > ${CGROUP_BASEDIR}/gpdb/cpuset.cpus" || true
+            sudo bash -c "echo '0' > ${CGROUP_BASEDIR}/gpdb/cpuset.mems" || true
+
+            # 4. Memory settings
+            sudo bash -c "echo 'max' > ${CGROUP_BASEDIR}/gpdb/memory.max" || true
+            sudo bash -c "echo '0' > ${CGROUP_BASEDIR}/gpdb/memory.min" || true
+            sudo bash -c "echo 'max' > ${CGROUP_BASEDIR}/gpdb/memory.high" || true
+
+            # 5. IO settings
+            echo "Available block devices:"
+            lsblk
+
+            sudo bash -c "
+              if [ -f ${CGROUP_BASEDIR}/gpdb/io.stat ]; then
+                echo 'Detected IO devices:'
+                cat ${CGROUP_BASEDIR}/gpdb/io.stat
+              fi
+              echo '' > ${CGROUP_BASEDIR}/gpdb/io.max || true
+            "
+
+            # 6. Fix permissions again after all writes
+            sudo chmod -R 777 ${CGROUP_BASEDIR}/gpdb
+            sudo chown -R gpadmin:gpadmin ${CGROUP_BASEDIR}/gpdb
+
+            # 7. Check required files (report only; a missing file is not fatal)
+            echo "Checking required files:"
+            required_files=(
+                "cgroup.procs"
+                "cpu.max"
+                "cpu.pressure"
+                "cpu.weight"
+                "cpu.weight.nice"
+                "cpu.stat"
+                "cpuset.cpus"
+                "cpuset.mems"
+                "cpuset.cpus.effective"
+                "cpuset.mems.effective"
+                "memory.current"
+                "io.max"
+            )
+
+            for file in "${required_files[@]}"; do
+                if [ -f "${CGROUP_BASEDIR}/gpdb/$file" ]; then
+                    echo "✓ $file exists"
+                    ls -l "${CGROUP_BASEDIR}/gpdb/$file"
+                else
+                    echo "✗ $file missing"
+                fi
+            done
+
+            # 8. Test subdirectory creation
+            echo "Testing subdirectory creation..."
+            sudo -u gpadmin bash -c "
+              TEST_DIR=${CGROUP_BASEDIR}/gpdb/test6448
+              if mkdir -p \$TEST_DIR; then
+                echo 'Created test directory'
+                sudo chmod -R 777 \$TEST_DIR
+                if echo \$\$ > \$TEST_DIR/cgroup.procs; then
+                  echo 'Successfully wrote to cgroup.procs'
+                  cat \$TEST_DIR/cgroup.procs
+                  # Move processes back to parent before cleanup
+                  echo \$\$ > ${CGROUP_BASEDIR}/gpdb/cgroup.procs
+                else
+                  echo 'Failed to write to cgroup.procs'
+                  ls -la \$TEST_DIR/cgroup.procs
+                fi
+                ls -la \$TEST_DIR/
+                rmdir \$TEST_DIR || {
+                  echo 'Moving all processes to parent before cleanup'
+                  cat \$TEST_DIR/cgroup.procs | while read pid; do
+                    echo \$pid > ${CGROUP_BASEDIR}/gpdb/cgroup.procs 2>/dev/null || true
+                  done
+                  rmdir \$TEST_DIR
+                }
+              else
+                echo 'Failed to create test directory'
+              fi
+            "
+
+            # 9. Verify setup as gpadmin user
+            echo "Testing cgroup access as gpadmin..."
+            sudo -u gpadmin bash -c "
+              echo 'Checking mounts...'
+              mount | grep cgroup
+
+              echo 'Checking /proc/self/mounts...'
+              cat /proc/self/mounts | grep cgroup
+
+              if ! grep -q cgroup2 /proc/self/mounts; then
+                  echo 'ERROR: cgroup2 mount NOT visible to gpadmin'
+                  exit 1
+              fi
+              echo 'SUCCESS: cgroup2 mount visible to gpadmin'
+
+              if ! [ -w ${CGROUP_BASEDIR}/gpdb ]; then
+                  echo 'ERROR: gpadmin cannot write to gpdb cgroup'
+                  exit 1
+              fi
+              echo 'SUCCESS: gpadmin can write to gpdb cgroup'
+
+              echo 'Verifying key files content:'
+              echo 'cpu.max:'
+              cat ${CGROUP_BASEDIR}/gpdb/cpu.max || echo 'Failed to read cpu.max'
+              echo 'cpuset.cpus:'
+              cat ${CGROUP_BASEDIR}/gpdb/cpuset.cpus || echo 'Failed to read cpuset.cpus'
+              echo 'cgroup.subtree_control:'
+              cat ${CGROUP_BASEDIR}/gpdb/cgroup.subtree_control || echo 'Failed to read cgroup.subtree_control'
+            "
+
+            # 10. Show final state
+            echo "Final cgroup state:"
+            ls -la ${CGROUP_BASEDIR}/gpdb/
+            echo "Cgroup setup completed successfully"
+          else
+            echo "Cgroup setup skipped"
+          fi
+
+      - name: "Generate Test Job Summary Start: ${{ matrix.test }}"
+        if: always()
+        # The script uses the bash-only [[ ]] test, so request bash explicitly
+        # instead of relying on the default shell.
+        shell: bash
+        run: |
+          # Write the summary header for this matrix entry: start time plus
+          # either the skip notice or the container's OS version.
+          {
+            echo "# Test Job Summary: ${{ matrix.test }} (Ubuntu 24.04)"
+            echo "## Environment"
+            echo "- Start Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+
+            if [[ "${{ needs.check-skip.outputs.should_skip }}" == "true" ]]; then
+              echo "## Skip Status"
+              echo "✓ Test execution skipped via CI skip flag"
+            else
+              # Ubuntu has no /etc/redhat-release; take the distribution name
+              # from /etc/os-release instead.
+              echo "- OS Version: $(. /etc/os-release && echo "${PRETTY_NAME}")"
+            fi
+          } >> "$GITHUB_STEP_SUMMARY"
+
+      - name: Download Cloudberry DEB build artifacts
+        if: needs.check-skip.outputs.should_skip != 'true'
+        uses: actions/download-artifact@v4
+        with:
+          name: apache-cloudberry-db-incubating-deb-ubuntu24.04-build-artifacts
+          # Take the artifact from the run named by reuse_artifacts_from_run_id
+          # when that input is set, otherwise from the current run.
+          run-id: ${{ github.event.inputs.reuse_artifacts_from_run_id || github.run_id }}
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          merge-multiple: false
+          path: ${{ github.workspace }}/deb_build_artifacts
+
+      - name: Download Cloudberry Source build artifacts
+        if: needs.check-skip.outputs.should_skip != 'true'
+        uses: actions/download-artifact@v4
+        with:
+          name: apache-cloudberry-db-incubating-deb-source-build-artifacts
+          # Take the artifact from the run named by reuse_artifacts_from_run_id
+          # when that input is set, otherwise from the current run.
+          run-id: ${{ github.event.inputs.reuse_artifacts_from_run_id || github.run_id }}
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          merge-multiple: false
+          path: ${{ github.workspace }}/source_build_artifacts
+
+      - name: Verify DEB artifacts
+        if: needs.check-skip.outputs.should_skip != 'true'
+        id: verify-artifacts
+        shell: bash
+        run: |
+          set -eo pipefail
+
+          # --- Source tarball: locate it, publish its path, log a checksum ---
+          SRC_TARBALL_FILE=$(ls "${GITHUB_WORKSPACE}"/source_build_artifacts/apache-cloudberry-db-incubating_*.tar.xz)
+          [ -f "${SRC_TARBALL_FILE}" ] || {
+            echo "::error::SRC TARBALL file not found"
+            exit 1
+          }
+
+          echo "src_tarball_file=${SRC_TARBALL_FILE}" >> "$GITHUB_OUTPUT"
+
+          echo "Verifying SRC TARBALL artifacts..."
+          {
+            echo "=== SRC TARBALL Verification Summary ==="
+            echo "Timestamp: $(date -u)"
+            echo "SRC TARBALL File: ${SRC_TARBALL_FILE}"
+
+            # Calculate and store checksum
+            echo "Checksum:"
+            sha256sum "${SRC_TARBALL_FILE}"
+
+          } 2>&1 | tee -a build-logs/details/src-tarball-verification.log
+
+          # --- Binary package: locate it, publish path/version/release ---
+          DEB_FILE=$(ls "${GITHUB_WORKSPACE}"/deb_build_artifacts/*.deb)
+          [ -f "${DEB_FILE}" ] || {
+            echo "::error::DEB file not found"
+            exit 1
+          }
+
+          echo "deb_file=${DEB_FILE}" >> "$GITHUB_OUTPUT"
+
+          echo "Verifying DEB artifacts..."
+          {
+            echo "=== DEB Verification Summary ==="
+            echo "Timestamp: $(date -u)"
+            echo "DEB File: ${DEB_FILE}"
+
+            # Dump the package control fields
+            echo "Package Information:"
+            dpkg-deb -f "${DEB_FILE}"
+
+            # Version and release are the 1st and 3rd dash-separated fields of
+            # the package Version string.
+            DEB_VERSION=$(dpkg-deb -f "${DEB_FILE}" Version | cut -d'-' -f 1)
+            DEB_RELEASE=$(dpkg-deb -f "${DEB_FILE}" Version | cut -d'-' -f 3)
+            echo "version=${DEB_VERSION}" >> "$GITHUB_OUTPUT"
+            echo "release=${DEB_RELEASE}" >> "$GITHUB_OUTPUT"
+
+            # The package listing must mention each critical binary
+            echo "Verifying critical files in DEB..."
+            for binary in "bin/postgres" "bin/psql"; do
+              dpkg-deb -c "${DEB_FILE}" | grep "${binary}" > /dev/null || {
+                echo "::error::Critical binary '${binary}' not found in DEB"
+                exit 1
+              }
+            done
+
+            echo "DEB Details:"
+            echo "- Version: ${DEB_VERSION}"
+            echo "- Release: ${DEB_RELEASE}"
+
+            # Calculate and store checksum
+            echo "Checksum:"
+            sha256sum "${DEB_FILE}"
+
+          } 2>&1 | tee -a build-logs/details/deb-verification.log
+
+      - name: Install Cloudberry DEB
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          DEB_FILE: ${{ steps.verify-artifacts.outputs.deb_file }}
+          DEB_VERSION: ${{ steps.verify-artifacts.outputs.version }}
+          DEB_RELEASE: ${{ steps.verify-artifacts.outputs.release }}
+        run: |
+          set -eo pipefail
+
+          # The package path comes from the verify-artifacts step outputs.
+          [ -n "${DEB_FILE}" ] || {
+            echo "::error::DEB_FILE environment variable is not set"
+            exit 1
+          }
+
+          {
+            echo "=== DEB Installation Log ==="
+            echo "Timestamp: $(date -u)"
+            echo "DEB File: ${DEB_FILE}"
+            echo "Version: ${DEB_VERSION}"
+            echo "Release: ${DEB_RELEASE}"
+
+            # Start from an empty install location
+            rm -rf /usr/local/cloudberry-db
+
+            # Install the package file through apt
+            echo "Starting installation..."
+            apt-get update
+            apt-get -y install "${DEB_FILE}" || {
+              echo "::error::DEB installation failed"
+              exit 1
+            }
+
+            # Hand the install tree back to gpadmin - later tests need it
+            chown -R gpadmin:gpadmin /usr/local/cloudberry-db
+
+            # Log the installed package status and its file list
+            echo "Installation completed successfully"
+            dpkg-query -s apache-cloudberry-db-incubating
+            echo "Installed files:"
+            dpkg-query -L apache-cloudberry-db-incubating
+          } 2>&1 | tee -a build-logs/details/deb-installation.log
+
+      - name: Extract source tarball
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          SRC_TARBALL_FILE: ${{ steps.verify-artifacts.outputs.src_tarball_file }}
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          # The tarball is unpacked into the parent of the workspace; the
+          # listing below expects a "cloudberry" directory there afterwards.
+          EXTRACT_ROOT="${SRC_DIR}/.."
+          EXTRACTED_TREE="${SRC_DIR}/../cloudberry"
+
+          {
+            echo "=== Source Extraction Log ==="
+            echo "Timestamp: $(date -u)"
+
+            echo "Starting extraction..."
+            file "${SRC_TARBALL_FILE}"
+            if ! time tar xf "${SRC_TARBALL_FILE}" -C "${EXTRACT_ROOT}" ; then
+              echo "::error::Source extraction failed"
+              exit 1
+            fi
+
+            echo "Extraction completed successfully"
+            echo "Extracted contents:"
+            ls -la "${EXTRACTED_TREE}"
+            echo "Directory size:"
+            du -sh "${EXTRACTED_TREE}"
+          } 2>&1 | tee -a build-logs/details/source-extraction.log
+
+      - name: Prepare DEB Environment
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          {
+
+            # change ownership to gpadmin
+            chown -R gpadmin "${SRC_DIR}/../cloudberry"
+            touch build-logs/sections.log
+            chown gpadmin build-logs/sections.log
+            chmod 777 build-logs
+
+            # configure link lib directory to temporary location, fix it
+            # NOTE(review): the link targets below live under /usr/cloudberry-db,
+            # while the install step cleans and chowns /usr/local/cloudberry-db -
+            # confirm which prefix the package really installs to.
+            rm -rf "${SRC_DIR}"/debian/build/lib
+            ln -sf /usr/cloudberry-db/lib "${SRC_DIR}"/debian/build/lib
+
+            # check if regress.so exists in src directory - it is needed for contrib/dblink tests
+            if [ ! -f "${SRC_DIR}/src/test/regress/regress.so" ]; then
+                ln -sf /usr/cloudberry-db/lib/postgresql/regress.so "${SRC_DIR}/src/test/regress/regress.so"
+            fi
+
+            # FIXME
+            # temporarily install gdb - delete after creating new docker build/test containers
+            apt-get update
+            apt-get -y install gdb
+
+          } 2>&1 | tee -a build-logs/details/prepare-deb-env.log
+
+      - name: Create Apache Cloudberry demo cluster
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        run: |
+          set -eo pipefail
+
+          {
+            CLUSTER_SCRIPT="${SRC_DIR}/devops/build/automation/cloudberry/scripts/create-cloudberry-demo-cluster.sh"
+            chmod +x "${CLUSTER_SCRIPT}"
+
+            # BLDWRAP_POSTGRES_CONF_ADDONS carries a shared_preload_libraries
+            # setting when the matrix entry specifies one; otherwise it is empty.
+            EXTRA_CONF=""
+            if [[ -n "${{ matrix.shared_preload_libraries }}" ]]; then
+              EXTRA_CONF="shared_preload_libraries='${{ matrix.shared_preload_libraries }}'"
+              echo "Adding shared_preload_libraries: ${{ matrix.shared_preload_libraries }}"
+            fi
+
+            # Create the cluster as gpadmin (login shell) from the source tree.
+            if ! time su - gpadmin -c "cd ${SRC_DIR} && NUM_PRIMARY_MIRROR_PAIRS='${{ matrix.num_primary_mirror_pairs }}' BLDWRAP_POSTGRES_CONF_ADDONS=\"${EXTRA_CONF}\" SRC_DIR=${SRC_DIR} ${CLUSTER_SCRIPT}"; then
+              echo "::error::Demo cluster creation failed"
+              exit 1
+            fi
+
+          } 2>&1 | tee -a build-logs/details/create-cloudberry-demo-cluster.log
+
+      - name: "Run Tests: ${{ matrix.test }}"
+        if: success() && needs.check-skip.outputs.should_skip != 'true'
+        env:
+          SRC_DIR: ${{ github.workspace }}
+          BUILD_DESTINATION: ${{ github.workspace }}/debian/build
+        shell: bash {0}
+        run: |
+          set -o pipefail
+
+          # Initialize test status
+          overall_status=0
+
+          # Create logs directory structure
+          mkdir -p build-logs/details
+
+          # Core file config
+          mkdir -p "/tmp/cloudberry-cores"
+          chmod 1777 "/tmp/cloudberry-cores"
+          sysctl -w kernel.core_pattern="/tmp/cloudberry-cores/core-%e-%s-%u-%g-%p-%t"
+          sysctl kernel.core_pattern
+          su - gpadmin -c "ulimit -c"
+
+          # WARNING: PostgreSQL Settings
+          # When adding new pg_settings key/value pairs:
+          # 1. Add a new check below for the setting
+          # 2. Follow the same pattern as optimizer
+          # 3. Update matrix entries to include the new setting
+
+
+          # Create extension if required
+          if [[ "${{ matrix.extension != '' }}" == "true" ]]; then
+            case "${{ matrix.extension }}" in
+              gp_stats_collector)
+                if ! su - gpadmin -c "source ${BUILD_DESTINATION}/cloudberry-env.sh && \
+                  source ${SRC_DIR}/gpAux/gpdemo/gpdemo-env.sh && \
+                  gpconfig -c shared_preload_libraries -v 'gp_stats_collector' && \
+                  gpstop -ra && \
+                  echo 'CREATE EXTENSION IF NOT EXISTS gp_stats_collector; \
+                        SHOW shared_preload_libraries; \
+                        TABLE pg_extension;' | \
+                    psql postgres"
+                then
+                    echo "Error creating gp_stats_collector extension"
+                    exit 1
+                fi
+                ;;
+              *)
+                echo "Unknown extension: ${{ matrix.extension }}"
+                exit 1
+                ;;
+            esac
+          fi
+
+          # Set PostgreSQL options if defined
+          PG_OPTS=""
+          if [[ "${{ matrix.pg_settings.optimizer != '' }}" == "true" ]]; then
+            PG_OPTS="$PG_OPTS -c optimizer=${{ matrix.pg_settings.optimizer }}"
+          fi
+
+          if [[ "${{ matrix.pg_settings.default_table_access_method != '' }}" == "true" ]]; then
+            PG_OPTS="$PG_OPTS -c default_table_access_method=${{ matrix.pg_settings.default_table_access_method }}"
+          fi
+
+          # Read configs into array
+          IFS=' ' read -r -a configs <<< "${{ join(matrix.make_configs, ' ') }}"
+
+          echo "=== Starting test execution for ${{ matrix.test }} ==="
+          echo "Number of configurations to execute: ${#configs[@]}"
+          echo ""
+
+          # Execute each config separately
+          for ((i=0; i<${#configs[@]}; i++)); do
+            config="${configs[$i]}"
+            IFS=':' read -r dir target <<< "$config"
+
+            echo "=== Executing configuration $((i+1))/${#configs[@]} ==="
+            echo "Make command: make -C $dir $target"
+            echo "Environment:"
+            echo "- PGOPTIONS: ${PG_OPTS}"
+
+            # Create unique log file for this configuration
+            config_log="build-logs/details/make-${{ matrix.test }}-config$i.log"
+
+            # Clean up any existing core files
+            echo "Cleaning up existing core files..."
+            rm -f /tmp/cloudberry-cores/core-*
+
+            # Execute test script with proper environment setup
+            if ! time su - gpadmin -c "cd ${SRC_DIR} && \
+                 MAKE_NAME='${{ matrix.test }}-config$i' \
+                 MAKE_TARGET='$target' \
+                 MAKE_DIRECTORY='-C $dir' \
+                 PGOPTIONS='${PG_OPTS}' \
+                 SRC_DIR='${SRC_DIR}' \
+                 ${SRC_DIR}/devops/build/automation/cloudberry/scripts/test-cloudberry.sh" \
+                 2>&1 | tee "$config_log"; then
+              echo "::warning::Test execution failed for configuration $((i+1)): make -C $dir $target"
+              overall_status=1
+            fi
+
+            # Check for results directory
+            results_dir="${dir}/results"
+
+            if [[ -d "$results_dir" ]]; then
+              echo "-----------------------------------------" | tee -a build-logs/details/make-${{ matrix.test }}-config$i-results.log
+              echo "Found results directory: $results_dir" | tee -a build-logs/details/make-${{ matrix.test }}-config$i-results.log
+              echo "Contents of results directory:" | tee -a build-logs/details/make-${{ matrix.test }}-config$i-results.log
+
+              find "$results_dir" -type f -ls >> "$log_file" 2>&1 | tee -a build-logs/details/make-${{ matrix.test }}-config$i-results.log
+              echo "-----------------------------------------" | tee -a build-logs/details/make-${{ matrix.test }}-config$i-results.log
+            else
+              echo "-----------------------------------------"
+              echo "Results directory $results_dir does not exit"
+              echo "-----------------------------------------"
+            fi
+
+            # Analyze any core files generated by this test configuration
+            echo "Analyzing core files for configuration ${{ matrix.test }}-config$i..."
+            test_id="${{ matrix.test }}-config$i"
+
+            # List the cores directory
+            echo "-----------------------------------------"
+            echo "Cores directory: /tmp/cloudberry-cores"
+            echo "Contents of cores directory:"
+            ls -Rl "/tmp/cloudberry-cores"
+            echo "-----------------------------------------"
+
+            "${SRC_DIR}"/devops/build/automation/cloudberry/scripts/analyze_core_dumps.sh "$test_id"
+            core_analysis_rc=$?
+            case "$core_analysis_rc" in
+              0) echo "No core dumps found for this configuration" ;;
+              1) echo "Core dumps were found and analyzed successfully" ;;
+              2) echo "::warning::Issues encountered during core dump analysis" ;;
+              *) echo "::error::Unexpected return code from core dump analysis: $core_analysis_rc" ;;
+            esac
+
+            echo "Log file: $config_log"
+            echo "=== End configuration $((i+1)) execution ==="
+            echo ""
+          done
+
+          echo "=== Test execution completed ==="
+          echo "Log files:"
+          ls -l build-logs/details/
+
+          # Store number of configurations for parsing step
+          echo "NUM_CONFIGS=${#configs[@]}" >> "$GITHUB_ENV"
+
+          # Report overall status
+          if [ $overall_status -eq 0 ]; then
+            echo "All test executions completed successfully"
+          else
+            echo "::warning::Some test executions failed, check individual logs for details"
+          fi
+
+          exit $overall_status
+
+      - name: "Parse Test Results: ${{ matrix.test }}"
+        id: test-results
+        if: always() && needs.check-skip.outputs.should_skip != 'true'  # parse even when the test step failed
+        env:
+          SRC_DIR: ${{ github.workspace }}
+        shell: bash {0}  # custom shell without -e: exit codes are inspected manually below
+        run: |
+          set -o pipefail
+
+          overall_status=0
+
+          # Get configs array to create context for results
+          IFS=' ' read -r -a configs <<< "${{ join(matrix.make_configs, ' ') }}"
+
+          echo "=== Starting results parsing for ${{ matrix.test }} ==="
+          echo "Number of configurations to parse: ${#configs[@]}"
+          echo ""
+
+          # Parse each configuration's results independently
+          for ((i=0; i<NUM_CONFIGS; i++)); do
+            config="${configs[$i]}"
+            IFS=':' read -r dir target <<< "$config"
+
+            config_log="build-logs/details/make-${{ matrix.test }}-config$i.log"
+
+            echo "=== Parsing results for configuration $((i+1))/${NUM_CONFIGS} ==="
+            echo "Make command: make -C $dir $target"
+            echo "Log file: $config_log"
+
+            if [ ! -f "$config_log" ]; then
+              echo "::error::Log file not found: $config_log"
+              {
+                echo "MAKE_COMMAND=\"make -C $dir $target\""
+                echo "STATUS=missing_log"
+                echo "TOTAL_TESTS=0"
+                echo "FAILED_TESTS=0"
+                echo "PASSED_TESTS=0"
+                echo "IGNORED_TESTS=0"
+              } > "test_results.${{ matrix.test }}.$i.txt"
+              overall_status=1
+              continue
+            fi
+
+            # Parse this configuration's results; the parser's exit code selects the
+            # branch below (0 = all passed, 1 = failures parsed, 2 = parse error).
+            MAKE_NAME="${{ matrix.test }}-config$i" \
+            "${SRC_DIR}"/devops/build/automation/cloudberry/scripts/parse-test-results.sh "$config_log"
+            status_code=$?
+
+            {
+                echo "SUITE_NAME=${{ matrix.test }}"
+                echo "DIR=${dir}"
+                echo "TARGET=${target}"
+            } >> test_results.txt
+
+            # Process return code
+            case $status_code in
+              0)  # All tests passed
+                  echo "All tests passed successfully"
+                  if [ -f test_results.txt ]; then
+                    (echo "MAKE_COMMAND=\"make -C $dir $target\""; cat test_results.txt) | tee "test_results.${{ matrix.test }}.$i.txt"
+                    rm test_results.txt
+                  fi
+                  ;;
+              1)  # Tests failed but parsed successfully
+                  echo "Test failures detected but properly parsed"
+                  if [ -f test_results.txt ]; then
+                    (echo "MAKE_COMMAND=\"make -C $dir $target\""; cat test_results.txt) | tee "test_results.${{ matrix.test }}.$i.txt"
+                    rm test_results.txt
+                  fi
+                  overall_status=1
+                  ;;
+              2)  # Parse error or missing file
+                  echo "::warning::Could not parse test results properly for configuration $((i+1))"
+                  {
+                    echo "MAKE_COMMAND=\"make -C $dir $target\""
+                    echo "STATUS=parse_error"
+                    echo "TOTAL_TESTS=0"
+                    echo "FAILED_TESTS=0"
+                    echo "PASSED_TESTS=0"
+                    echo "IGNORED_TESTS=0"
+                  } | tee "test_results.${{ matrix.test }}.$i.txt"
+                  overall_status=1
+                  ;;
+              *)  # Unexpected error
+                  echo "::warning::Unexpected error during test results parsing for configuration $((i+1))"
+                  {
+                    echo "MAKE_COMMAND=\"make -C $dir $target\""
+                    echo "STATUS=unknown_error"
+                    echo "TOTAL_TESTS=0"
+                    echo "FAILED_TESTS=0"
+                    echo "PASSED_TESTS=0"
+                    echo "IGNORED_TESTS=0"
+                  } | tee "test_results.${{ matrix.test }}.$i.txt"
+                  overall_status=1
+                  ;;
+            esac
+
+            echo "Results stored in test_results.${{ matrix.test }}.$i.txt"
+            echo "=== End parsing for configuration $((i+1)) ==="
+            echo ""
+          done
+
+          # Report status of results files
+          echo "=== Results file status ==="
+          echo "Generated results files:"
+          for ((i=0; i<NUM_CONFIGS; i++)); do
+            if [ -f "test_results.${{ matrix.test }}.$i.txt" ]; then
+              echo "- test_results.${{ matrix.test }}.$i.txt exists"
+              echo ""
+            else
+              echo "::error::Missing results file: test_results.${{ matrix.test }}.$i.txt"
+              overall_status=1
+            fi
+          done
+
+          exit $overall_status
+
+      - name: Check and Display Regression Diffs
+        if: always()  # show diffs regardless of how earlier steps ended
+        shell: bash {0}
+        run: |
+          # Locate the first regression.diffs anywhere below the working directory
+          diffs_path="$(find . -type f -name "regression.diffs" | head -n 1)"
+          if [[ -z "$diffs_path" ]]; then
+            echo "No regression.diffs file found in the hierarchy."
+          else
+            echo "Found regression.diffs at: $diffs_path"
+            cat "$diffs_path"
+          fi
+
+      - name: "Check for Core Dumps Across All Configurations: ${{ matrix.test }}"
+        if: always() && needs.check-skip.outputs.should_skip != 'true'
+        shell: bash {0}
+        run: |
+          # Collect core analysis logs under build-logs; use the working directory if SRC_DIR is unset in this step
+          core_files=$(find "${SRC_DIR:-.}/build-logs" -name "core_analysis_*.log")
+
+          if [ -n "$core_files" ]; then
+            echo "::error::Core dumps were found during test execution:"
+            echo "$core_files" | while read -r file; do
+              echo "Core analysis file: $file"
+              echo "=== Content ==="
+              cat "$file"
+              echo "=============="
+            done
+            if [ "${{ matrix.enable_core_check }}" = "true" ]; then
+              exit 1
+            else
+              echo "::warning::Special case - core checks will generate a warning"
+            fi
+          else
+            echo "No core dumps were found during test execution"
+          fi
+
+      - name: "Generate Test Job Summary End: ${{ matrix.test }}"
+        if: always()  # always write a summary, including for skipped or cancelled runs
+        shell: bash {0}
+        run: |
+          {
+            if [[ "${{ needs.check-skip.outputs.should_skip }}" == "true" ]]; then
+              echo "## Test Results - SKIPPED"
+              echo "- End Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+              exit 0
+            fi
+
+            echo "## Test Results"
+            echo "- End Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+
+            # Check if job was cancelled
+            if [[ "${{ job.status }}" == "cancelled" ]]; then
+              echo "### Test Status"
+              echo "🚫 Test execution was cancelled"
+              echo ""
+              echo "### Execution Summary"
+              echo "Test run was interrupted and did not complete. No test results are available."
+              exit 0
+            fi
+
+            # Check for core analysis files (working directory is used if SRC_DIR is unset in this step)
+            core_files=$(find "${SRC_DIR:-.}/build-logs" -name "core_analysis_*.log")
+
+            if [ -n "$core_files" ]; then
+              if [ "${{ matrix.enable_core_check }}" = "true" ]; then
+                echo "❌ Core dumps were detected"
+              else
+                echo "⚠️  Core dumps were detected - enable_core_check: false"
+              fi
+              echo ""
+              echo "#### Core Analysis Files"
+              echo "\`\`\`"
+              echo "$core_files"
+              echo "\`\`\`"
+
+              echo ""
+              echo "#### Analysis Details"
+              echo "\`\`\`"
+              while read -r file; do
+                echo "=== $file ==="
+                cat "$file"
+                echo ""
+              done <<< "$core_files"
+              echo "\`\`\`"
+            else
+              echo "✅ No core dumps detected"
+            fi
+
+            # Process results for each configuration
+            IFS=' ' read -r -a configs <<< "${{ join(matrix.make_configs, ' ') }}"
+
+            for ((i=0; i<NUM_CONFIGS; i++)); do
+              config="${configs[$i]}"
+              IFS=':' read -r dir target <<< "$config"
+
+              echo "### Configuration $((i+1)): \`make -C $dir $target\`"
+
+              if [[ ! -f "test_results.${{ matrix.test }}.$i.txt" ]]; then
+                echo "⚠️ No results file found for this configuration"
+                continue
+              fi
+
+              # Source configuration results
+              # shellcheck source=/dev/null
+              . "test_results.${{ matrix.test }}.$i.txt"
+
+              # Render the sourced values: status, test counts, then failed/ignored test names
+              # Display status with emoji
+              echo "#### Status"
+              case "${STATUS:-unknown}" in
+                passed)
+                  echo "✅ All tests passed"
+                  ;;
+                failed)
+                  echo "❌ Some tests failed"
+                  ;;
+                parse_error)
+                  echo "⚠️ Could not parse test results"
+                  ;;
+                unknown_error)
+                  echo "⚠️ Unexpected error during test execution/parsing"
+                  ;;
+                missing_log)
+                  echo "⚠️ Test log file missing"
+                  ;;
+                *)
+                  echo "⚠️ Unknown status: ${STATUS:-unknown}"
+                  ;;
+              esac
+
+              echo ""
+              echo "#### Test Counts"
+              echo "| Metric | Count |"
+              echo "|--------|-------|"
+              echo "| Total Tests | ${TOTAL_TESTS:-0} |"
+              echo "| Passed Tests | ${PASSED_TESTS:-0} |"
+              echo "| Failed Tests | ${FAILED_TESTS:-0} |"
+              echo "| Ignored Tests | ${IGNORED_TESTS:-0} |"
+
+              # Add failed tests if any
+              if [[ -n "${FAILED_TEST_NAMES:-}" && "${FAILED_TESTS:-0}" != "0" ]]; then
+                echo ""
+                echo "#### Failed Tests"
+                echo "${FAILED_TEST_NAMES}" | tr ',' '\n' | while read -r test; do
+                  if [[ -n "$test" ]]; then
+                    echo "* \`${test}\`"
+                  fi
+                done
+              fi
+
+              # Add ignored tests if any
+              if [[ -n "${IGNORED_TEST_NAMES:-}" && "${IGNORED_TESTS:-0}" != "0" ]]; then
+                echo ""
+                echo "#### Ignored Tests"
+                echo "${IGNORED_TEST_NAMES}" | tr ',' '\n' | while read -r test; do
+                  if [[ -n "$test" ]]; then
+                    echo "* \`${test}\`"
+                  fi
+                done
+              fi
+
+              echo ""
+              echo "---"
+            done
+
+          } >> "$GITHUB_STEP_SUMMARY" || true
+
+      - name: Upload test logs  # publishes the whole build-logs/ directory as an artifact
+        if: always()  # upload regardless of how earlier steps ended
+        uses: actions/upload-artifact@v4
+        with:
+          name: test-logs-${{ matrix.test }}-${{ needs.build-deb.outputs.build_timestamp }}
+          path: |
+            build-logs/
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}  # retention period comes from the LOG_RETENTION_DAYS env value
+
+      - name: Upload Test Metadata  # publishes every test_results*.txt file from the working directory
+        if: always()  # upload regardless of how earlier steps ended
+        uses: actions/upload-artifact@v4
+        with:
+          name: test-metadata-${{ matrix.test }}  # one artifact per matrix test entry
+          path: |
+            test_results*.txt
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}  # retention period comes from the LOG_RETENTION_DAYS env value
+
+      - name: Upload test results files  # no `if:` here, so this runs only when all earlier steps succeeded
+        uses: actions/upload-artifact@v4
+        with:
+          name: results-${{ matrix.test }}-${{ needs.build-deb.outputs.build_timestamp }}
+          path: |
+            **/regression.out
+            **/regression.diffs
+            **/results/
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}  # retention period comes from the LOG_RETENTION_DAYS env value
+
+      - name: Upload test regression logs  # regression output plus the gpdemo log directories listed below
+        if: failure() || cancelled()  # only when an earlier step failed or the run was cancelled
+        uses: actions/upload-artifact@v4
+        with:
+          name: regression-logs-${{ matrix.test }}-${{ needs.build-deb.outputs.build_timestamp }}
+          path: |
+            **/regression.out
+            **/regression.diffs
+            **/results/
+            gpAux/gpdemo/datadirs/standby/log/
+            gpAux/gpdemo/datadirs/qddir/demoDataDir-1/log/
+            gpAux/gpdemo/datadirs/dbfast1/demoDataDir0/log/
+            gpAux/gpdemo/datadirs/dbfast2/demoDataDir1/log/
+            gpAux/gpdemo/datadirs/dbfast3/demoDataDir2/log/
+            gpAux/gpdemo/datadirs/dbfast_mirror1/demoDataDir0/log/
+            gpAux/gpdemo/datadirs/dbfast_mirror2/demoDataDir1/log/
+            gpAux/gpdemo/datadirs/dbfast_mirror3/demoDataDir2/log/
+          retention-days: ${{ env.LOG_RETENTION_DAYS }}  # retention period comes from the LOG_RETENTION_DAYS env value
+
+  ## ======================================================================
+  ## Job: report-deb
+  ## ======================================================================
+
+  report-deb:
+    name: Generate Apache Cloudberry Build Report (Ubuntu 24.04)
+    needs: [check-skip, build-deb, prepare-test-matrix-deb, deb-install-test, test-deb]
+    if: always()  # report even when upstream jobs failed or were skipped
+    runs-on: ubuntu-22.04
+    steps:
+      - name: Generate Final Report  # appends the pipeline outcome to the job summary
+        run: |
+          {
+            echo "# Apache Cloudberry Build Pipeline Report"
+
+            if [[ "${{ needs.check-skip.outputs.should_skip }}" != "true" ]]; then
+              echo "## Job Status"
+              echo "- Build Job: ${{ needs.build-deb.result }}"
+              echo "- Test Job: ${{ needs.test-deb.result }}"
+              echo "- Completion Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+
+              if [[ "${{ needs.build-deb.result }}" != "success" || "${{ needs.test-deb.result }}" != "success" ]]; then
+                echo "⚠️ Pipeline completed with failures"
+
+                if [[ "${{ needs.build-deb.result }}" != "success" ]]; then
+                  echo "### Build Job Failure"
+                  echo "Check build logs for details"
+                fi
+
+                if [[ "${{ needs.test-deb.result }}" != "success" ]]; then
+                  echo "### Test Job Failure"
+                  echo "Check test logs and regression files for details"
+                fi
+              else
+                echo "✅ Pipeline completed successfully"
+              fi
+            else
+              echo "## CI Skip Status"
+              echo "✅ CI checks skipped via skip flag"
+              echo "- Completion Time: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+            fi
+          } >> "$GITHUB_STEP_SUMMARY"
+
+      - name: Notify on failure  # emits an error annotation; the step itself does not exit non-zero
+        if: |
+          needs.check-skip.outputs.should_skip != 'true' &&
+          (needs.build-deb.result != 'success' || needs.test-deb.result != 'success')
+        run: |
+          echo "::error::Build/Test pipeline failed! Check job summaries and logs for details"
+          echo "Timestamp: $(date -u +'%Y-%m-%d %H:%M:%S UTC')"
+          echo "Build Result: ${{ needs.build-deb.result }}"
+          echo "Test Result: ${{ needs.test-deb.result }}"
diff --git a/.github/workflows/build-deb-cloudberry.yml b/.github/workflows/build-deb-cloudberry.yml
index 85d917b8ff0..f8eadee3c8f 100644
--- a/.github/workflows/build-deb-cloudberry.yml
+++ b/.github/workflows/build-deb-cloudberry.yml
@@ -252,6 +252,10 @@ jobs:
                                "gpcontrib/gp_sparse_vector:installcheck",
                                "gpcontrib/gp_toolkit:installcheck"]
               },
+              {"test":"gpcontrib-gp-stats-collector",
+               "make_configs":["gpcontrib/gp_stats_collector:installcheck"],
+               "extension":"gp_stats_collector"
+              },
               {"test":"ic-cbdb-parallel",
                "make_configs":["src/test/regress:installcheck-cbdb-parallel"]
               }
@@ -1341,6 +1345,7 @@ jobs:
         if: success() && needs.check-skip.outputs.should_skip != 'true'
         env:
           SRC_DIR: ${{ github.workspace }}
+          BUILD_DESTINATION: ${{ github.workspace }}/debian/build
         shell: bash {0}
         run: |
           set -o pipefail
@@ -1365,6 +1370,30 @@ jobs:
           # 3. Update matrix entries to include the new setting
 
 
+          # Create extension if required
+          if [[ "${{ matrix.extension != '' }}" == "true" ]]; then
+            case "${{ matrix.extension }}" in
+              gp_stats_collector)
+                if ! su - gpadmin -c "source ${BUILD_DESTINATION}/cloudberry-env.sh && \
+                  source ${SRC_DIR}/gpAux/gpdemo/gpdemo-env.sh && \
+                  gpconfig -c shared_preload_libraries -v 'gp_stats_collector' && \
+                  gpstop -ra && \
+                  echo 'CREATE EXTENSION IF NOT EXISTS gp_stats_collector; \
+                        SHOW shared_preload_libraries; \
+                        TABLE pg_extension;' | \
+                    psql postgres"
+                then
+                    echo "Error creating gp_stats_collector extension"
+                    exit 1
+                fi
+                ;;
+              *)
+                echo "Unknown extension: ${{ matrix.extension }}"
+                exit 1
+                ;;
+            esac
+          fi
+
           # Set PostgreSQL options if defined
           PG_OPTS=""
           if [[ "${{ matrix.pg_settings.optimizer != '' }}" == "true" ]]; then
@@ -1589,6 +1618,7 @@ jobs:
 
       - name: Check and Display Regression Diffs
         if: always()
+        shell: bash {0}
         run: |
           # Search for regression.diffs recursively
           found_file=$(find . -type f -name "regression.diffs" | head -n 1)
diff --git a/.github/workflows/coverity.yml b/.github/workflows/coverity.yml
index 4f7f74d54b2..2b6a81c91f4 100644
--- a/.github/workflows/coverity.yml
+++ b/.github/workflows/coverity.yml
@@ -90,7 +90,7 @@ jobs:
              /usr/local/cloudberry-db/lib
         sudo chown -R gpadmin:gpadmin /usr/local/cloudberry-db
         su - gpadmin -c "cd $WORKSPACE"
-        export LD_LIBRARY_PATH=/usr/local/cloudberry-db/lib:LD_LIBRARY_PATH
+        export LD_LIBRARY_PATH=/usr/local/cloudberry-db/lib:${LD_LIBRARY_PATH:-""}
         export PATH=$WORKSPACE/coverity_tool/bin:$PATH
         ./configure --prefix=/usr/local/cloudberry-db \
             --disable-external-fts \
diff --git a/.github/workflows/docker-cbdb-build-containers.yml b/.github/workflows/docker-cbdb-build-containers.yml
index dd9ea9acd27..538b4e9b179 100644
--- a/.github/workflows/docker-cbdb-build-containers.yml
+++ b/.github/workflows/docker-cbdb-build-containers.yml
@@ -60,6 +60,7 @@ on:
     paths:
       - 'devops/deploy/docker/build/rocky8/**'
       - 'devops/deploy/docker/build/rocky9/**'
+      - 'devops/deploy/docker/build/rocky10/**'
       - 'devops/deploy/docker/build/ubuntu22.04/**'
       - 'devops/deploy/docker/build/ubuntu24.04/**'
   pull_request:
@@ -81,7 +82,7 @@ jobs:
     # Matrix strategy to build for both Rocky Linux 8 and 9, Ubuntu 22.04 and 24.04
     strategy:
       matrix:
-        platform: ['rocky8', 'rocky9', 'ubuntu22.04', 'ubuntu24.04']
+        platform: ['rocky8', 'rocky9', 'rocky10', 'ubuntu22.04', 'ubuntu24.04']
 
     steps:
       # Checkout repository code with full history
@@ -108,6 +109,8 @@ jobs:
               - 'devops/deploy/docker/build/rocky8/**'
             rocky9:
               - 'devops/deploy/docker/build/rocky9/**'
+            rocky10:
+              - 'devops/deploy/docker/build/rocky10/**'
             ubuntu22.04:
               - 'devops/deploy/docker/build/ubuntu22.04/**'
             ubuntu24.04:
@@ -117,13 +120,13 @@ jobs:
       # This allows building ARM64 images on AMD64 infrastructure and vice versa
       - name: Set up QEMU
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' }}
-        uses: docker/setup-qemu-action@v3
+        uses: docker/setup-qemu-action@ce360397dd3f832beb865e1373c09c0e9f86d70a # v4.0.0
 
       # Login to DockerHub for pushing images
       # Requires DOCKERHUB_USER and DOCKERHUB_TOKEN secrets to be set
       - name: Login to Docker Hub
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' && github.event_name == 'push' && github.ref == 'refs/heads/main' }}
-        uses: docker/login-action@v3
+        uses: docker/login-action@c94ce9fb468520275223c153574b00df6fe4bcc9 # v3.7.0
         with:
           username: ${{ secrets.DOCKERHUB_USER }}
           password: ${{ secrets.DOCKERHUB_TOKEN }}
@@ -132,7 +135,7 @@ jobs:
       # Enable debug mode for better troubleshooting
       - name: Set up Docker Buildx
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' }}
-        uses: docker/setup-buildx-action@v3
+        uses: docker/setup-buildx-action@8d2750c68a42422c14e847fe6c8ac0403b4cbd6f # v3.12.0
         with:
           buildkitd-flags: --debug
 
@@ -172,7 +175,7 @@ jobs:
       # This creates a manifest list that supports both architectures
       - name: Build and Push Multi-arch Docker images
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' && github.event_name == 'push' && github.ref == 'refs/heads/main' }}
-        uses: docker/build-push-action@v6
+        uses: docker/build-push-action@10e90e3645eae34f1e60eeb005ba3a3d33f178e8 # v6.19.2
         with:
           context: ./devops/deploy/docker/build/${{ matrix.platform }}
           push: true
diff --git a/.github/workflows/docker-cbdb-test-containers.yml b/.github/workflows/docker-cbdb-test-containers.yml
index 1c8e1c8a9a2..4d0fb8def33 100644
--- a/.github/workflows/docker-cbdb-test-containers.yml
+++ b/.github/workflows/docker-cbdb-test-containers.yml
@@ -49,6 +49,7 @@ on:
     paths:
       - 'devops/deploy/docker/test/rocky8/**'
       - 'devops/deploy/docker/test/rocky9/**'
+      - 'devops/deploy/docker/test/rocky10/**'
       - 'devops/deploy/docker/test/ubuntu22.04/**'
       - 'devops/deploy/docker/test/ubuntu24.04/**'
   pull_request:
@@ -68,7 +69,7 @@ jobs:
     strategy:
       matrix:
         # Build for Rocky Linux 8 and 9, Ubuntu 22.04 and 24.04
-        platform: ['rocky8', 'rocky9', 'ubuntu22.04', 'ubuntu24.04']
+        platform: ['rocky8', 'rocky9', 'rocky10', 'ubuntu22.04', 'ubuntu24.04']
 
     steps:
       # Checkout repository code
@@ -92,6 +93,8 @@ jobs:
               - 'devops/deploy/docker/test/rocky8/**'
             rocky9:
               - 'devops/deploy/docker/test/rocky9/**'
+            rocky10:
+              - 'devops/deploy/docker/test/rocky10/**'
             ubuntu22.04:
               - 'devops/deploy/docker/test/ubuntu22.04/**'
             ubuntu24.04:
@@ -106,12 +109,12 @@ jobs:
       # This allows building ARM64 images on AMD64 infrastructure and vice versa
       - name: Set up QEMU
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' }}
-        uses: docker/setup-qemu-action@v3
+        uses: docker/setup-qemu-action@ce360397dd3f832beb865e1373c09c0e9f86d70a # v4.0.0
 
       # Login to DockerHub for pushing images
       - name: Login to Docker Hub
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' && github.event_name == 'push' && github.ref == 'refs/heads/main' }}
-        uses: docker/login-action@v3
+        uses: docker/login-action@c94ce9fb468520275223c153574b00df6fe4bcc9 # v3.7.0
         with:
           username: ${{ secrets.DOCKERHUB_USER }}
           password: ${{ secrets.DOCKERHUB_TOKEN }}
@@ -119,7 +122,7 @@ jobs:
       # Setup Docker Buildx for efficient multi-architecture builds
       - name: Set up Docker Buildx
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' }}
-        uses: docker/setup-buildx-action@v3
+        uses: docker/setup-buildx-action@8d2750c68a42422c14e847fe6c8ac0403b4cbd6f # v3.12.0
         with:
           buildkitd-flags: --debug
 
@@ -142,7 +145,7 @@ jobs:
       # Creates a manifest list that supports both architectures
       - name: Build and Push Multi-arch Docker images
         if: ${{ steps.platform-filter.outputs[matrix.platform] == 'true' && github.event_name == 'push' && github.ref == 'refs/heads/main' }}
-        uses: docker/build-push-action@v6
+        uses: docker/build-push-action@10e90e3645eae34f1e60eeb005ba3a3d33f178e8 # v6.19.2
         with:
           context: ./devops/deploy/docker/test/${{ matrix.platform }}
           push: true
diff --git a/.github/workflows/sonarqube.yml b/.github/workflows/sonarqube.yml
index e67c2d96a54..93379d184ea 100644
--- a/.github/workflows/sonarqube.yml
+++ b/.github/workflows/sonarqube.yml
@@ -94,7 +94,7 @@ jobs:
              /usr/local/xerces-c/lib/libxerces-c-3.3.so \
              /usr/local/cloudberry-db/lib
         sudo chown -R gpadmin:gpadmin /usr/local/cloudberry-db
-        export LD_LIBRARY_PATH=/usr/local/cloudberry-db/lib:LD_LIBRARY_PATH
+        export LD_LIBRARY_PATH=/usr/local/cloudberry-db/lib:${LD_LIBRARY_PATH:-""}
         ./configure --prefix=/usr/local/cloudberry-db \
             --disable-external-fts \
             --enable-gpcloud \
diff --git a/LICENSE b/LICENSE
index 28796e982e1..0ccd7072122 100644
--- a/LICENSE
+++ b/LICENSE
@@ -246,7 +246,7 @@ The PostgreSQL software includes:
       
       src/backend/utils/adt/inet_cidr_ntop.c
       src/backend/utils/adt/inet_net_pton.c
-      see licenses/licenses/LICENSE-isc.txt
+      see licenses/LICENSE-isc.txt
 
 ----------------------------
    Perl Artistic License 2.0 (exception)
diff --git a/configure b/configure
index e91414fb52c..74d1415d637 100755
--- a/configure
+++ b/configure
@@ -721,6 +721,9 @@ GREP
 with_apr_config
 with_libcurl
 with_rt
+PROTOC
+with_gp_stats_collector
+with_diskquota
 with_zstd
 with_libbz2
 LZ4_LIBS
@@ -943,6 +946,8 @@ with_zlib
 with_lz4
 with_libbz2
 with_zstd
+with_diskquota
+with_gp_stats_collector
 with_rt
 with_libcurl
 with_apr_config
@@ -1703,11 +1708,14 @@ Optional Packages:
   --with-lz4              build with LZ4 support
   --without-libbz2        do not use bzip2
   --without-zstd          do not build with Zstandard
+  --with-diskquota        build with diskquota extension
+  --with-gp_stats_collector
+                          build with stats collector extension
   --without-rt            do not use Realtime Library
   --without-libcurl       do not use libcurl
   --with-apr-config=PATH  path to apr-1-config utility
   --with-gnu-ld           assume the C compiler uses GNU ld [default=no]
-  --without-mdblocales    build without MDB locales
+  --with-mdblocales       build with MDB locales
   --with-ssl=LIB          use LIB for SSL/TLS support (openssl)
   --with-openssl          obsolete spelling of --with-ssl=openssl
 
@@ -2924,6 +2932,7 @@ PG_PACKAGE_VERSION=14.7
 
 
 
+
 ac_aux_dir=
 for ac_dir in config "$srcdir"/config; do
   if test -f "$ac_dir/install-sh"; then
@@ -11157,6 +11166,184 @@ fi
 $as_echo "$with_zstd" >&6; }
 
 
+#
+# diskquota
+#
+
+
+
+# Check whether --with-diskquota was given.
+if test "${with_diskquota+set}" = set; then :
+  withval=$with_diskquota;
+  case $withval in
+    yes)
+      :
+      ;;
+    no)
+      :
+      ;;
+    *)
+      as_fn_error $? "no argument expected for --with-diskquota option" "$LINENO" 5
+      ;;
+  esac
+
+else
+  with_diskquota=no
+
+fi
+
+
+
+
+#
+# gp_stats_collector
+#
+
+
+
+# Check whether --with-gp_stats_collector was given.
+if test "${with_gp_stats_collector+set}" = set; then :
+  withval=$with_gp_stats_collector;
+  case $withval in
+    yes)
+      :
+      ;;
+    no)
+      :
+      ;;
+    *)
+      as_fn_error $? "no argument expected for --with-gp_stats_collector option" "$LINENO" 5
+      ;;
+  esac
+
+else
+  with_gp_stats_collector=no
+
+fi
+
+
+
+
+if test "$with_gp_stats_collector" = yes; then
+
+pkg_failed=no
+{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for protobuf >= 3.0.0" >&5
+$as_echo_n "checking for protobuf >= 3.0.0... " >&6; }
+
+if test -n "$PROTOBUF_CFLAGS"; then
+    pkg_cv_PROTOBUF_CFLAGS="$PROTOBUF_CFLAGS"
+ elif test -n "$PKG_CONFIG"; then
+    if test -n "$PKG_CONFIG" && \
+    { { $as_echo "$as_me:${as_lineno-$LINENO}: \$PKG_CONFIG --exists --print-errors \"protobuf >= 3.0.0\""; } >&5
+  ($PKG_CONFIG --exists --print-errors "protobuf >= 3.0.0") 2>&5
+  ac_status=$?
+  $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
+  test $ac_status = 0; }; then
+  pkg_cv_PROTOBUF_CFLAGS=`$PKG_CONFIG --cflags "protobuf >= 3.0.0" 2>/dev/null`
+		      test "x$?" != "x0" && pkg_failed=yes
+else
+  pkg_failed=yes
+fi
+ else
+    pkg_failed=untried
+fi
+if test -n "$PROTOBUF_LIBS"; then
+    pkg_cv_PROTOBUF_LIBS="$PROTOBUF_LIBS"
+ elif test -n "$PKG_CONFIG"; then
+    if test -n "$PKG_CONFIG" && \
+    { { $as_echo "$as_me:${as_lineno-$LINENO}: \$PKG_CONFIG --exists --print-errors \"protobuf >= 3.0.0\""; } >&5
+  ($PKG_CONFIG --exists --print-errors "protobuf >= 3.0.0") 2>&5
+  ac_status=$?
+  $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
+  test $ac_status = 0; }; then
+  pkg_cv_PROTOBUF_LIBS=`$PKG_CONFIG --libs "protobuf >= 3.0.0" 2>/dev/null`
+		      test "x$?" != "x0" && pkg_failed=yes
+else
+  pkg_failed=yes
+fi
+ else
+    pkg_failed=untried
+fi
+
+
+
+if test $pkg_failed = yes; then
+        { $as_echo "$as_me:${as_lineno-$LINENO}: result: no" >&5
+$as_echo "no" >&6; }
+
+if $PKG_CONFIG --atleast-pkgconfig-version 0.20; then
+        _pkg_short_errors_supported=yes
+else
+        _pkg_short_errors_supported=no
+fi
+        if test $_pkg_short_errors_supported = yes; then
+	        PROTOBUF_PKG_ERRORS=`$PKG_CONFIG --short-errors --print-errors --cflags --libs "protobuf >= 3.0.0" 2>&1`
+        else
+	        PROTOBUF_PKG_ERRORS=`$PKG_CONFIG --print-errors --cflags --libs "protobuf >= 3.0.0" 2>&1`
+        fi
+	# Put the nasty error message in config.log where it belongs
+	echo "$PROTOBUF_PKG_ERRORS" >&5
+
+	as_fn_error $? "protobuf >= 3.0.0 is required for gp_stats_collector" "$LINENO" 5
+
+elif test $pkg_failed = untried; then
+        { $as_echo "$as_me:${as_lineno-$LINENO}: result: no" >&5
+$as_echo "no" >&6; }
+	as_fn_error $? "protobuf >= 3.0.0 is required for gp_stats_collector" "$LINENO" 5
+
+else
+	PROTOBUF_CFLAGS=$pkg_cv_PROTOBUF_CFLAGS
+	PROTOBUF_LIBS=$pkg_cv_PROTOBUF_LIBS
+        { $as_echo "$as_me:${as_lineno-$LINENO}: result: yes" >&5
+$as_echo "yes" >&6; }
+
+fi
+  # Extract the first word of "protoc", so it can be a program name with args.
+set dummy protoc; ac_word=$2
+{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for $ac_word" >&5
+$as_echo_n "checking for $ac_word... " >&6; }
+if ${ac_cv_path_PROTOC+:} false; then :
+  $as_echo_n "(cached) " >&6
+else
+  case $PROTOC in
+  [\\/]* | ?:[\\/]*)
+  ac_cv_path_PROTOC="$PROTOC" # Let the user override the test with a path.
+  ;;
+  *)
+  as_save_IFS=$IFS; IFS=$PATH_SEPARATOR
+for as_dir in $PATH
+do
+  IFS=$as_save_IFS
+  test -z "$as_dir" && as_dir=.
+    for ac_exec_ext in '' $ac_executable_extensions; do
+  if as_fn_executable_p "$as_dir/$ac_word$ac_exec_ext"; then
+    ac_cv_path_PROTOC="$as_dir/$ac_word$ac_exec_ext"
+    $as_echo "$as_me:${as_lineno-$LINENO}: found $as_dir/$ac_word$ac_exec_ext" >&5
+    break 2
+  fi
+done
+  done
+IFS=$as_save_IFS
+
+  test -z "$ac_cv_path_PROTOC" && ac_cv_path_PROTOC="no"
+  ;;
+esac
+fi
+PROTOC=$ac_cv_path_PROTOC
+if test -n "$PROTOC"; then
+  { $as_echo "$as_me:${as_lineno-$LINENO}: result: $PROTOC" >&5
+$as_echo "$PROTOC" >&6; }
+else
+  { $as_echo "$as_me:${as_lineno-$LINENO}: result: no" >&5
+$as_echo "no" >&6; }
+fi
+
+
+  if test "$PROTOC" = no; then
+    as_fn_error $? "protoc is required for gp_stats_collector but was not found in PATH" "$LINENO" 5
+  fi
+fi
+
 if test "$with_zstd" = yes; then
 
 pkg_failed=no
@@ -12979,56 +13166,6 @@ $as_echo "${python_libspec} ${python_additional_libs}" >&6; }
 
 
 
-fi
-
-if test "$with_mdblocales" = yes; then
-  { $as_echo "$as_me:${as_lineno-$LINENO}: checking for mdb_setlocale in -lmdblocales" >&5
-$as_echo_n "checking for mdb_setlocale in -lmdblocales... " >&6; }
-if ${ac_cv_lib_mdblocales_mdb_setlocale+:} false; then :
-  $as_echo_n "(cached) " >&6
-else
-  ac_check_lib_save_LIBS=$LIBS
-LIBS="-lmdblocales  $LIBS"
-cat confdefs.h - <<_ACEOF >conftest.$ac_ext
-/* end confdefs.h.  */
-
-/* Override any GCC internal prototype to avoid an error.
-   Use char because int might match the return type of a GCC
-   builtin and then its argument prototype would still apply.  */
-#ifdef __cplusplus
-extern "C"
-#endif
-char mdb_setlocale ();
-int
-main ()
-{
-return mdb_setlocale ();
-  ;
-  return 0;
-}
-_ACEOF
-if ac_fn_c_try_link "$LINENO"; then :
-  ac_cv_lib_mdblocales_mdb_setlocale=yes
-else
-  ac_cv_lib_mdblocales_mdb_setlocale=no
-fi
-rm -f core conftest.err conftest.$ac_objext \
-    conftest$ac_exeext conftest.$ac_ext
-LIBS=$ac_check_lib_save_LIBS
-fi
-{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $ac_cv_lib_mdblocales_mdb_setlocale" >&5
-$as_echo "$ac_cv_lib_mdblocales_mdb_setlocale" >&6; }
-if test "x$ac_cv_lib_mdblocales_mdb_setlocale" = xyes; then :
-  cat >>confdefs.h <<_ACEOF
-#define HAVE_LIBMDBLOCALES 1
-_ACEOF
-
-  LIBS="-lmdblocales $LIBS"
-
-else
-  as_fn_error $? "mdblocales library not found" "$LINENO" 5
-fi
-
 fi
 
 if test x"$cross_compiling" = x"yes" && test -z "$with_system_tzdata"; then
@@ -14953,6 +15090,56 @@ fi
 
 fi
 
+if test "$with_mdblocales" = yes; then
+  { $as_echo "$as_me:${as_lineno-$LINENO}: checking for mdb_setlocale in -lmdblocales" >&5
+$as_echo_n "checking for mdb_setlocale in -lmdblocales... " >&6; }
+if ${ac_cv_lib_mdblocales_mdb_setlocale+:} false; then :
+  $as_echo_n "(cached) " >&6
+else
+  ac_check_lib_save_LIBS=$LIBS
+LIBS="-lmdblocales  $LIBS"
+cat confdefs.h - <<_ACEOF >conftest.$ac_ext
+/* end confdefs.h.  */
+
+/* Override any GCC internal prototype to avoid an error.
+   Use char because int might match the return type of a GCC
+   builtin and then its argument prototype would still apply.  */
+#ifdef __cplusplus
+extern "C"
+#endif
+char mdb_setlocale ();
+int
+main ()
+{
+return mdb_setlocale ();
+  ;
+  return 0;
+}
+_ACEOF
+if ac_fn_c_try_link "$LINENO"; then :
+  ac_cv_lib_mdblocales_mdb_setlocale=yes
+else
+  ac_cv_lib_mdblocales_mdb_setlocale=no
+fi
+rm -f core conftest.err conftest.$ac_objext \
+    conftest$ac_exeext conftest.$ac_ext
+LIBS=$ac_check_lib_save_LIBS
+fi
+{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $ac_cv_lib_mdblocales_mdb_setlocale" >&5
+$as_echo "$ac_cv_lib_mdblocales_mdb_setlocale" >&6; }
+if test "x$ac_cv_lib_mdblocales_mdb_setlocale" = xyes; then :
+  cat >>confdefs.h <<_ACEOF
+#define HAVE_LIBMDBLOCALES 1
+_ACEOF
+
+  LIBS="-lmdblocales $LIBS"
+
+else
+  as_fn_error $? "mdblocales library not found" "$LINENO" 5
+fi
+
+fi
+
 if test "$enable_external_fts" = yes; then
 { $as_echo "$as_me:${as_lineno-$LINENO}: checking for jansson_version_str in -ljansson" >&5
 $as_echo_n "checking for jansson_version_str in -ljansson... " >&6; }
diff --git a/configure.ac b/configure.ac
index 9a07159cecf..f0584d65076 100644
--- a/configure.ac
+++ b/configure.ac
@@ -1368,6 +1368,31 @@ PGAC_ARG_BOOL(with, zstd, yes, [do not build with Zstandard],
 AC_MSG_RESULT([$with_zstd])
 AC_SUBST(with_zstd)
 
+#
+# diskquota
+#
+PGAC_ARG_BOOL(with, diskquota, no,
+              [build with diskquota extension])
+AC_SUBST(with_diskquota)
+
+#
+# gp_stats_collector
+#
+PGAC_ARG_BOOL(with, gp_stats_collector, no,
+              [build with stats collector extension])
+AC_SUBST(with_gp_stats_collector)
+
+if test "$with_gp_stats_collector" = yes; then
+  PKG_CHECK_MODULES([PROTOBUF], [protobuf >= 3.0.0],
+    [],
+    [AC_MSG_ERROR([protobuf >= 3.0.0 is required for gp_stats_collector])]
+  )
+  AC_PATH_PROG([PROTOC], [protoc], [no])
+  if test "$PROTOC" = no; then
+    AC_MSG_ERROR([protoc is required for gp_stats_collector but was not found in PATH])
+  fi
+fi
+
 if test "$with_zstd" = yes; then
   dnl zstd_errors.h was renamed from error_public.h in v1.4.0
   PKG_CHECK_MODULES([ZSTD], [libzstd >= 1.4.0])
@@ -1469,7 +1494,7 @@ AC_SUBST(install_bin)
 # MDB locales
 #
 
-PGAC_ARG_BOOL(with, mdblocales, yes, [build without MDB locales],
+PGAC_ARG_BOOL(with, mdblocales, no, [build with MDB locales],
               [AC_DEFINE([USE_MDBLOCALES], 1, [Define to 1 to build with MDB locales. (--with-mdblocales)])])
 AC_SUBST(USE_MDBLOCALES)
 
@@ -3194,4 +3219,11 @@ AC_OUTPUT
 # The configure args contain '-Wl,-rpath,\$$ORIGIN`, when it falls
 # as a C literal string, it's invalid, so converting `\` to `\\`
 # to be correct for C program.
-sed -i '/define CONFIGURE_ARGS/s,\([[^\\]]\)\\\$\$,\1\\\\$$,g' src/include/pg_config.h
+#
+# `sed -i` is not specified by POSIX, and GNU sed and BSD/macOS sed disagree
+# on whether it takes a separate backup-suffix argument, so no single
+# in-place invocation is portable.  Write the result to a temporary file
+# and rename it over the original instead.
+pg_config_h=src/include/pg_config.h
+sed '/define CONFIGURE_ARGS/s,\([[^\\]]\)\\\$\$,\1\\\\$$,g' "$pg_config_h" >"$pg_config_h.tmp" &&
+  mv "$pg_config_h.tmp" "$pg_config_h"
diff --git a/contrib/btree_gist/expected/cash_optimizer.out b/contrib/btree_gist/expected/cash_optimizer.out
index 171dec7e511..f2c9ac07420 100644
--- a/contrib/btree_gist/expected/cash_optimizer.out
+++ b/contrib/btree_gist/expected/cash_optimizer.out
@@ -77,12 +77,11 @@ SELECT a, a <-> '21472.79' FROM moneytmp ORDER BY a <-> '21472.79' LIMIT 3;
                          QUERY PLAN                         
 ------------------------------------------------------------
  Limit
-   ->  Sort
-         Sort Key: ((a <-> '$21,472.79'::money))
-         ->  Result
-               ->  Gather Motion 3:1  (slice1; segments: 3)
-                     ->  Seq Scan on moneytmp
- Optimizer: GPORCA
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Merge Key: ((a <-> '$21,472.79'::money))
+         ->  Limit
+               ->  Index Only Scan using moneyidx on moneytmp
+                     Order By: (a <-> '$21,472.79'::money)
 (7 rows)
 
 SELECT a, a <-> '21472.79' FROM moneytmp ORDER BY a <-> '21472.79' LIMIT 3;
diff --git a/contrib/btree_gist/expected/date_optimizer.out b/contrib/btree_gist/expected/date_optimizer.out
index a77041f847f..12269cf169b 100644
--- a/contrib/btree_gist/expected/date_optimizer.out
+++ b/contrib/btree_gist/expected/date_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '2001-02-13' FROM datetmp ORDER BY a <-> '2001-02-13' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '02-13-2001'::date))
-         ->  Sort
-               Sort Key: ((a <-> '02-13-2001'::date))
-               ->  Seq Scan on datetmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using dateidx on datetmp
+                     Order By: (a <-> '02-13-2001'::date)
 (7 rows)
 
 SELECT a, a <-> '2001-02-13' FROM datetmp ORDER BY a <-> '2001-02-13' LIMIT 3;
diff --git a/contrib/btree_gist/expected/float4_optimizer.out b/contrib/btree_gist/expected/float4_optimizer.out
index cc40e9bd1ae..7b71a2f5112 100644
--- a/contrib/btree_gist/expected/float4_optimizer.out
+++ b/contrib/btree_gist/expected/float4_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '-179.0' FROM float4tmp ORDER BY a <-> '-179.0' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '-179'::real))
-         ->  Sort
-               Sort Key: ((a <-> '-179'::real))
-               ->  Seq Scan on float4tmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using float4idx on float4tmp
+                     Order By: (a <-> '-179'::real)
 (7 rows)
 
 SELECT a, a <-> '-179.0' FROM float4tmp ORDER BY a <-> '-179.0' LIMIT 3;
diff --git a/contrib/btree_gist/expected/float8_optimizer.out b/contrib/btree_gist/expected/float8_optimizer.out
index 1bd96c44d3b..18e5c195286 100644
--- a/contrib/btree_gist/expected/float8_optimizer.out
+++ b/contrib/btree_gist/expected/float8_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '-1890.0' FROM float8tmp ORDER BY a <-> '-1890.0' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '-1890'::double precision))
-         ->  Sort
-               Sort Key: ((a <-> '-1890'::double precision))
-               ->  Seq Scan on float8tmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using float8idx on float8tmp
+                     Order By: (a <-> '-1890'::double precision)
 (7 rows)
 
 SELECT a, a <-> '-1890.0' FROM float8tmp ORDER BY a <-> '-1890.0' LIMIT 3;
diff --git a/contrib/btree_gist/expected/int2_optimizer.out b/contrib/btree_gist/expected/int2_optimizer.out
index fdfc859097b..f8f6a428b93 100644
--- a/contrib/btree_gist/expected/int2_optimizer.out
+++ b/contrib/btree_gist/expected/int2_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '237' FROM int2tmp ORDER BY a <-> '237' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '237'::smallint))
-         ->  Sort
-               Sort Key: ((a <-> '237'::smallint))
-               ->  Seq Scan on int2tmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using int2idx on int2tmp
+                     Order By: (a <-> '237'::smallint)
 (7 rows)
 
 SELECT a, a <-> '237' FROM int2tmp ORDER BY a <-> '237' LIMIT 3;
diff --git a/contrib/btree_gist/expected/int4_optimizer.out b/contrib/btree_gist/expected/int4_optimizer.out
index 67107e63bfa..6877fb09af5 100644
--- a/contrib/btree_gist/expected/int4_optimizer.out
+++ b/contrib/btree_gist/expected/int4_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '237' FROM int4tmp ORDER BY a <-> '237' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> 237))
-         ->  Sort
-               Sort Key: ((a <-> 237))
-               ->  Seq Scan on int4tmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using int4idx on int4tmp
+                     Order By: (a <-> 237)
 (7 rows)
 
 SELECT a, a <-> '237' FROM int4tmp ORDER BY a <-> '237' LIMIT 3;
diff --git a/contrib/btree_gist/expected/int8_optimizer.out b/contrib/btree_gist/expected/int8_optimizer.out
index ba8e21135e8..962dd314661 100644
--- a/contrib/btree_gist/expected/int8_optimizer.out
+++ b/contrib/btree_gist/expected/int8_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '464571291354841' FROM int8tmp ORDER BY a <-> '464571291354841'
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '464571291354841'::bigint))
-         ->  Sort
-               Sort Key: ((a <-> '464571291354841'::bigint))
-               ->  Seq Scan on int8tmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using int8idx on int8tmp
+                     Order By: (a <-> '464571291354841'::bigint)
 (7 rows)
 
 SELECT a, a <-> '464571291354841' FROM int8tmp ORDER BY a <-> '464571291354841' LIMIT 3;
diff --git a/contrib/btree_gist/expected/interval_optimizer.out b/contrib/btree_gist/expected/interval_optimizer.out
index f5afd17456b..f0a4e850aeb 100644
--- a/contrib/btree_gist/expected/interval_optimizer.out
+++ b/contrib/btree_gist/expected/interval_optimizer.out
@@ -74,15 +74,15 @@ SELECT count(*) FROM intervaltmp WHERE a >  '199 days 21:21:23'::interval;
 
 EXPLAIN (COSTS OFF)
 SELECT a, a <-> '199 days 21:21:23' FROM intervaltmp ORDER BY a <-> '199 days 21:21:23' LIMIT 3;
-                                    QUERY PLAN                                     
------------------------------------------------------------------------------------
+                                      QUERY PLAN                                       
+---------------------------------------------------------------------------------------
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval))
-         ->  Sort
-               Sort Key: ((a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval))
-               ->  Seq Scan on intervaltmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using intervalidx on intervaltmp
+                     Order By: (a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval)
+ Optimizer: Postgres query optimizer
 (7 rows)
 
 SELECT a, a <-> '199 days 21:21:23' FROM intervaltmp ORDER BY a <-> '199 days 21:21:23' LIMIT 3;
@@ -96,15 +96,15 @@ SELECT a, a <-> '199 days 21:21:23' FROM intervaltmp ORDER BY a <-> '199 days 21
 SET enable_indexonlyscan=off;
 EXPLAIN (COSTS OFF)
 SELECT a, a <-> '199 days 21:21:23' FROM intervaltmp ORDER BY a <-> '199 days 21:21:23' LIMIT 3;
-                                    QUERY PLAN                                     
------------------------------------------------------------------------------------
+                                      QUERY PLAN                                       
+---------------------------------------------------------------------------------------
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval))
-         ->  Sort
-               Sort Key: ((a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval))
-               ->  Seq Scan on intervaltmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Scan using intervalidx on intervaltmp
+                     Order By: (a <-> '@ 199 days 21 hours 21 mins 23 secs'::interval)
+ Optimizer: Postgres query optimizer
 (7 rows)
 
 SELECT a, a <-> '199 days 21:21:23' FROM intervaltmp ORDER BY a <-> '199 days 21:21:23' LIMIT 3;
diff --git a/contrib/btree_gist/expected/time_optimizer.out b/contrib/btree_gist/expected/time_optimizer.out
index 590ada880b9..40d49e79b02 100644
--- a/contrib/btree_gist/expected/time_optimizer.out
+++ b/contrib/btree_gist/expected/time_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '10:57:11' FROM timetmp ORDER BY a <-> '10:57:11' LIMIT 3;
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> '10:57:11'::time without time zone))
-         ->  Sort
-               Sort Key: ((a <-> '10:57:11'::time without time zone))
-               ->  Seq Scan on timetmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using timeidx on timetmp
+                     Order By: (a <-> '10:57:11'::time without time zone)
 (7 rows)
 
 SELECT a, a <-> '10:57:11' FROM timetmp ORDER BY a <-> '10:57:11' LIMIT 3;
diff --git a/contrib/btree_gist/expected/timestamp_optimizer.out b/contrib/btree_gist/expected/timestamp_optimizer.out
index 1b8e709fe90..85c3a1a5e5d 100644
--- a/contrib/btree_gist/expected/timestamp_optimizer.out
+++ b/contrib/btree_gist/expected/timestamp_optimizer.out
@@ -79,10 +79,9 @@ SELECT a, a <-> '2004-10-26 08:55:08' FROM timestamptmp ORDER BY a <-> '2004-10-
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> 'Tue Oct 26 08:55:08 2004'::timestamp without time zone))
-         ->  Sort
-               Sort Key: ((a <-> 'Tue Oct 26 08:55:08 2004'::timestamp without time zone))
-               ->  Seq Scan on timestamptmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using timestampidx on timestamptmp
+                     Order By: (a <-> 'Tue Oct 26 08:55:08 2004'::timestamp without time zone)
 (7 rows)
 
 SELECT a, a <-> '2004-10-26 08:55:08' FROM timestamptmp ORDER BY a <-> '2004-10-26 08:55:08' LIMIT 3;
diff --git a/contrib/btree_gist/expected/timestamptz_optimizer.out b/contrib/btree_gist/expected/timestamptz_optimizer.out
index 2173c5dca35..a9e043f98a6 100644
--- a/contrib/btree_gist/expected/timestamptz_optimizer.out
+++ b/contrib/btree_gist/expected/timestamptz_optimizer.out
@@ -199,10 +199,9 @@ SELECT a, a <-> '2018-12-18 10:59:54 GMT+2' FROM timestamptztmp ORDER BY a <-> '
  Limit
    ->  Gather Motion 3:1  (slice1; segments: 3)
          Merge Key: ((a <-> 'Tue Dec 18 04:59:54 2018 PST'::timestamp with time zone))
-         ->  Sort
-               Sort Key: ((a <-> 'Tue Dec 18 04:59:54 2018 PST'::timestamp with time zone))
-               ->  Seq Scan on timestamptztmp
- Optimizer: GPORCA
+         ->  Limit
+               ->  Index Only Scan using timestamptzidx on timestamptztmp
+                     Order By: (a <-> 'Tue Dec 18 04:59:54 2018 PST'::timestamp with time zone)
 (7 rows)
 
 SELECT a, a <-> '2018-12-18 10:59:54 GMT+2' FROM timestamptztmp ORDER BY a <-> '2018-12-18 10:59:54 GMT+2' LIMIT 3;
diff --git a/contrib/pax_storage/expected/cbdb_parallel.out b/contrib/pax_storage/expected/cbdb_parallel.out
index db583090026..ec6ceba7e3c 100644
--- a/contrib/pax_storage/expected/cbdb_parallel.out
+++ b/contrib/pax_storage/expected/cbdb_parallel.out
@@ -41,13 +41,29 @@ set gp_appendonly_insert_files = 4;
 begin;
 set local enable_parallel = on;
 create table test_131_ao1(x int, y int) using ao_row with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_ao2(x int, y int) using ao_row with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_ao3(x int, y int) using ao_row with(parallel_workers=0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_ao4(x int, y int) using ao_row with(parallel_workers=0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_aoco1(x int, y int) using ao_column with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_aoco2(x int, y int) using ao_column with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_aoco3(x int, y int) using ao_column with(parallel_workers=0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table test_131_aoco4(x int, y int) using ao_column with(parallel_workers=0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 select relname, reloptions from pg_catalog.pg_class where relname like 'test_131_ao%';
     relname     |      reloptions      
 ----------------+----------------------
@@ -155,8 +171,14 @@ explain(locus, costs off) select count(*) from test_131_aoco3, test_131_aoco4 wh
 
 abort;
 create table ao1(x int, y int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table ao2(x int, y int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table aocs1(x int, y int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'x' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 begin;
 -- encourage use of parallel plans
 set local min_parallel_table_scan_size = 0;
@@ -367,6 +389,8 @@ abort;
 begin;
 set local max_parallel_workers_per_gather = 2;
 create table t1(a int, b int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table rt1(a int, b int) with(parallel_workers=2) distributed replicated;
 create table rt2(a int, b int) distributed replicated;
 create table rt3(a int, b int) distributed replicated;
@@ -599,6 +623,8 @@ select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
   5 |  6 |  4 |  5 |  5 |  6
   8 |  9 |  7 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
+  1 |  2 |  1 |  1 |  1 |  2
+  2 |  3 |  1 |  2 |  2 |  3
   5 |  6 |  5 |  5 |  5 |  6
   6 |  7 |  6 |  6 |  6 |  7
   9 | 10 |  9 |  9 |  9 | 10
@@ -606,8 +632,6 @@ select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
   6 |  7 |  5 |  6 |  6 |  7
   7 |  8 |  6 |  7 |  7 |  8
  10 | 11 |  9 | 10 | 10 | 11
-  1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
 (19 rows)
 
 -- parallel hash join
@@ -650,13 +674,6 @@ explain(locus, costs off) select * from rt1 join t1 on rt1.a = t1.b join rt2 on
 select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
-  5 |  6 |  5 |  5 |  5 |  6
-  6 |  7 |  5 |  6 |  6 |  7
-  6 |  7 |  6 |  6 |  6 |  7
-  7 |  8 |  6 |  7 |  7 |  8
-  9 | 10 |  9 |  9 |  9 | 10
- 10 | 11 |  9 | 10 | 10 | 11
- 10 | 11 | 10 | 10 | 10 | 11
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  2 |  3 |  3 |  4
   3 |  4 |  3 |  3 |  3 |  4
@@ -669,6 +686,13 @@ select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
   9 | 10 |  8 |  9 |  9 | 10
   1 |  2 |  1 |  1 |  1 |  2
   2 |  3 |  1 |  2 |  2 |  3
+  5 |  6 |  5 |  5 |  5 |  6
+  6 |  7 |  5 |  6 |  6 |  7
+  6 |  7 |  6 |  6 |  6 |  7
+  7 |  8 |  6 |  7 |  7 |  8
+  9 | 10 |  9 |  9 |  9 | 10
+ 10 | 11 |  9 | 10 | 10 | 11
+ 10 | 11 | 10 | 10 | 10 | 11
 (19 rows)
 
 --
@@ -702,6 +726,8 @@ explain(locus, costs off) select * from rt1 join t1 on rt1.a = t1.b join rt3 on
 select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
+  1 |  2 |  1 |  1 |  1 |  2
+  2 |  3 |  1 |  2 |  2 |  3
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  3 |  3 |  3 |  4
   4 |  5 |  4 |  4 |  4 |  5
@@ -712,8 +738,6 @@ select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
   5 |  6 |  4 |  5 |  5 |  6
   8 |  9 |  7 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
-  1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
   5 |  6 |  5 |  5 |  5 |  6
   6 |  7 |  6 |  6 |  6 |  7
   9 | 10 |  9 |  9 |  9 | 10
@@ -779,6 +803,8 @@ select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
 (19 rows)
 
 create table t2(a int, b int) with(parallel_workers=0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table rt4(a int, b int) with(parallel_workers=2) distributed replicated;
 insert into t2 select i, i+1 from generate_series(1, 10) i;
 insert into rt4 select i, i+1 from generate_series(1, 10000) i;
@@ -788,16 +814,16 @@ set local enable_parallel = off;
 select * from rt4 join t2 using(b);
  b  | a  | a  
 ----+----+----
-  2 |  1 |  1
-  6 |  5 |  5
-  7 |  6 |  6
- 10 |  9 |  9
- 11 | 10 | 10
   3 |  2 |  2
   4 |  3 |  3
   5 |  4 |  4
   8 |  7 |  7
   9 |  8 |  8
+  2 |  1 |  1
+  6 |  5 |  5
+  7 |  6 |  6
+ 10 |  9 |  9
+ 11 | 10 | 10
 (10 rows)
 
 set local enable_parallel = on;
@@ -828,19 +854,21 @@ explain(locus, costs off) select * from rt4 join t2 using(b);
 select * from rt4 join t2 using(b);
  b  | a  | a  
 ----+----+----
-  2 |  1 |  1
+  6 |  5 |  5
+  7 |  6 |  6
+ 10 |  9 |  9
+ 11 | 10 | 10
   3 |  2 |  2
   4 |  3 |  3
   5 |  4 |  4
   8 |  7 |  7
   9 |  8 |  8
-  6 |  5 |  5
-  7 |  6 |  6
- 10 |  9 |  9
- 11 | 10 | 10
+  2 |  1 |  1
 (10 rows)
 
 create table t3(a int, b int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t3 select i, i+1 from generate_series(1, 9000) i;
 analyze t3;
 set local enable_parallel = off;
@@ -919,10 +947,10 @@ explain(locus, costs off) select * from t_replica_workers_2 join t_random_worker
 select * from t_replica_workers_2 join t_random_workers_0 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
- 3 | 4 | 4
  1 | 2 | 2
+ 2 | 3 | 3
  4 | 5 | 5
+ 3 | 4 | 4
  5 | 6 | 6
 (5 rows)
 
@@ -931,11 +959,11 @@ set local enable_parallel=false;
 select * from t_replica_workers_2 join t_random_workers_0 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
  3 | 4 | 4
- 1 | 2 | 2
- 4 | 5 | 5
  5 | 6 | 6
+ 4 | 5 | 5
+ 1 | 2 | 2
+ 2 | 3 | 3
 (5 rows)
 
 abort;
@@ -976,11 +1004,11 @@ explain(locus, costs off) select * from t_replica_workers_2 right join t_random_
 select * from t_replica_workers_2 right join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
- 5 | 6 | 6
  1 | 2 | 2
  2 | 3 | 3
  3 | 4 | 4
  4 | 5 | 5
+ 5 | 6 | 6
 (5 rows)
 
 -- non parallel results
@@ -1028,14 +1056,14 @@ explain(locus, costs off) select * from t_replica_workers_2 join t_random_worker
                      Locus: Strewn
                      Parallel Workers: 2
  Optimizer: Postgres query optimizer
-(16 rows)
+(15 rows)
 
 select * from t_replica_workers_2 join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
  1 | 2 | 2
  3 | 4 | 4
+ 2 | 3 | 3
  4 | 5 | 5
  5 | 6 | 6
 (5 rows)
@@ -1045,9 +1073,9 @@ set local enable_parallel=false;
 select * from t_replica_workers_2 join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
  1 | 2 | 2
  3 | 4 | 4
+ 2 | 3 | 3
  4 | 5 | 5
  5 | 6 | 6
 (5 rows)
@@ -1059,7 +1087,11 @@ abort;
 --
 begin;
 create table t1(a int, b int) with(parallel_workers=3);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table t2(b int, a int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'b' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i, i+1 from generate_series(1, 10) i;
 insert into t2 select i, i+1 from generate_series(1, 5) i;
 analyze t1;
@@ -1071,17 +1103,17 @@ explain(costs off) select * from t1 right join t2 on t1.b = t2.a;
                             QUERY PLAN                            
 ------------------------------------------------------------------
  Gather Motion 9:1  (slice1; segments: 9)
-   ->  Parallel Hash Left Join
-         Hash Cond: (t2.a = t1.b)
-         ->  Redistribute Motion 6:9  (slice2; segments: 6)
-               Hash Key: t2.a
+   ->  Parallel Hash Right Join
+         Hash Cond: (t1.b = t2.a)
+         ->  Redistribute Motion 9:9  (slice2; segments: 9)
+               Hash Key: t1.b
                Hash Module: 3
-               ->  Parallel Seq Scan on t2
+               ->  Parallel Seq Scan on t1
          ->  Parallel Hash
-               ->  Redistribute Motion 9:9  (slice3; segments: 9)
-                     Hash Key: t1.b
+               ->  Redistribute Motion 6:9  (slice3; segments: 6)
+                     Hash Key: t2.a
                      Hash Module: 3
-                     ->  Parallel Seq Scan on t1
+                     ->  Parallel Seq Scan on t2
  Optimizer: Postgres query optimizer
 (13 rows)
 
@@ -1091,7 +1123,11 @@ abort;
 --
 begin;
 create table t1(a int, b int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table t2(a int, b int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i%10, i from generate_series(1, 5) i;
 insert into t1 values (100000);
 insert into t2 select i%10, i from generate_series(1, 100000) i;
@@ -1100,34 +1136,34 @@ analyze t2;
 set local enable_parallel = on;
 -- parallel hash join with shared table, SinglQE as outer partial path.
 explain(locus, costs off) select * from (select count(*) as a from t2) t2 left join t1 on t1.a = t2.a;
-                            QUERY PLAN                            
-------------------------------------------------------------------
+                               QUERY PLAN                               
+------------------------------------------------------------------------
  Gather Motion 6:1  (slice1; segments: 6)
    Locus: Entry
-   ->  Parallel Hash Left Join
-         Locus: Hashed
+   ->  Parallel Hash Right Join
+         Locus: HashedWorkers
          Parallel Workers: 2
-         Hash Cond: ((count(*)) = t1.a)
-         ->  Redistribute Motion 1:6  (slice2; segments: 1)
-               Locus: Hashed
+         Hash Cond: (t1.a = (count(*)))
+         ->  Parallel Seq Scan on t1
+               Locus: HashedWorkers
                Parallel Workers: 2
-               Hash Key: (count(*))
-               Hash Module: 3
-               ->  Finalize Aggregate
-                     Locus: SingleQE
-                     ->  Gather Motion 6:1  (slice3; segments: 6)
-                           Locus: SingleQE
-                           ->  Partial Aggregate
-                                 Locus: HashedWorkers
-                                 Parallel Workers: 2
-                                 ->  Parallel Seq Scan on t2
-                                       Locus: HashedWorkers
-                                       Parallel Workers: 2
          ->  Parallel Hash
                Locus: Hashed
-               ->  Parallel Seq Scan on t1
-                     Locus: HashedWorkers
+               ->  Redistribute Motion 1:6  (slice2; segments: 1)
+                     Locus: Hashed
                      Parallel Workers: 2
+                     Hash Key: (count(*))
+                     Hash Module: 3
+                     ->  Finalize Aggregate
+                           Locus: SingleQE
+                           ->  Gather Motion 6:1  (slice3; segments: 6)
+                                 Locus: SingleQE
+                                 ->  Partial Aggregate
+                                       Locus: HashedWorkers
+                                       Parallel Workers: 2
+                                       ->  Parallel Seq Scan on t2
+                                             Locus: HashedWorkers
+                                             Parallel Workers: 2
  Optimizer: Postgres query optimizer
 (27 rows)
 
@@ -1323,12 +1359,18 @@ begin;
 create table rt1(a int, b int) distributed replicated;
 create table rt2(a int, b int) with (parallel_workers = 0) distributed replicated;
 create table t1(a int, b int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table t2(a int, b int) with (parallel_workers = 0);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i, i+1 from generate_series(1, 10000) i;
 insert into t2 select i, i+1 from generate_series(1, 10000) i;
 insert into rt1 select i, i+1 from generate_series(1, 10000) i;
 insert into rt2 select i, i+1 from generate_series(1, 10000) i;
 CREATE TABLE sq1 AS SELECT a, b FROM t1 WHERE gp_segment_id = 0;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 set local optimizer=off;
 set local enable_parallel=on;
 set local min_parallel_table_scan_size to 0;
@@ -1385,7 +1427,7 @@ explain (locus, costs off) select * from rt1 union all select * from t1;
          ->  Result
                Locus: Strewn
                Parallel Workers: 2
-               One-Time Filter: (gp_execution_segment() = 1)
+               One-Time Filter: (gp_execution_segment() = 0)
                ->  Parallel Seq Scan on rt1
                      Locus: SegmentGeneralWorkers
                      Parallel Workers: 2
@@ -1409,7 +1451,7 @@ explain (locus, costs off) select * from rt1 union all select * from t2;
          ->  Result
                Locus: Strewn
                Parallel Workers: 2
-               One-Time Filter: (gp_execution_segment() = 1)
+               One-Time Filter: (gp_execution_segment() = 0)
                ->  Parallel Seq Scan on rt1
                      Locus: SegmentGeneralWorkers
                      Parallel Workers: 2
@@ -1482,6 +1524,8 @@ abort;
 --
 begin;
 create table t1(c1 int, c2 int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c1' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i, i+1 from generate_series(1, 100000) i;
 analyze t1;
 set local optimizer = off;
@@ -1549,6 +1593,8 @@ abort;
 --
 begin;
 create table t1(c1 int, c2 int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c1' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i, i+1 from generate_series(1, 100000) i;
 analyze t1;
 set local optimizer = off;
@@ -1768,6 +1814,8 @@ set local optimizer = off;
 set local enable_parallel = on;
 -- ao table
 create table ao (a INT, b INT) using ao_row;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into ao select i as a, i as b from generate_series(1, 100) AS i;
 alter table ao set (parallel_workers = 2);
 explain(costs off) select count(*) from ao;
@@ -1789,6 +1837,8 @@ select count(*) from ao;
 alter table ao reset (parallel_workers);
 -- aocs table
 create table aocs (a INT, b INT) using ao_column;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into aocs select i as a, i as b from generate_series(1, 100) AS i;
 alter table aocs set (parallel_workers = 2);
 explain(costs off) select count(*) from aocs;
@@ -1862,9 +1912,14 @@ select * from
 abort;
 begin;
 create table pagg_tab (a int, b int, c text, d int) partition by list(c);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table pagg_tab_p1 partition of pagg_tab for values in ('0000', '0001', '0002', '0003', '0004');
+NOTICE:  table has parent, setting distribution columns to match parent table
 create table pagg_tab_p2 partition of pagg_tab for values in ('0005', '0006', '0007', '0008');
+NOTICE:  table has parent, setting distribution columns to match parent table
 create table pagg_tab_p3 partition of pagg_tab for values in ('0009', '0010', '0011');
+NOTICE:  table has parent, setting distribution columns to match parent table
 insert into pagg_tab select i % 20, i % 30, to_char(i % 12, 'FM0000'), i % 30 from generate_series(0, 2999) i;
 analyze pagg_tab;
 set local enable_parallel to off;
@@ -1939,7 +1994,11 @@ abort;
 --
 begin;
 create table t1(a int, b int) with(parallel_workers=3);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table t2(b int, a int) with(parallel_workers=2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'b' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t1 select i, i+1 from generate_series(1, 10) i;
 insert into t2 select i, i+1 from generate_series(1, 5) i;
 analyze t1;
@@ -2329,6 +2388,8 @@ abort;
 -- prepare, execute locus is null
 begin;
 create table t1(c1 int, c2 int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c1' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 analyze t1;
 prepare t1_count(integer) as select count(*) from t1;
 explain(locus, costs off) execute t1_count(1);
diff --git a/contrib/pax_storage/src/test/isolation2/expected/pax/copy_to_concurrent_reorganize.out b/contrib/pax_storage/src/test/isolation2/expected/pax/copy_to_concurrent_reorganize.out
deleted file mode 100644
index b4beed7d035..00000000000
--- a/contrib/pax_storage/src/test/isolation2/expected/pax/copy_to_concurrent_reorganize.out
+++ /dev/null
@@ -1,289 +0,0 @@
--- Test: PAX table — relation-based COPY TO concurrent with ALTER TABLE SET WITH (reorganize=true)
--- Issue: https://github.com/apache/cloudberry/issues/1545
--- Same as test 2.1 in the main isolation2 suite but for PAX storage.
-
-CREATE TABLE copy_reorg_pax_test (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_reorg_pax_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_pax_test;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_reorg_pax_test SET WITH (reorganize=true);
-ALTER
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_pax_test TO '/tmp/copy_reorg_pax_test.csv';  <waiting ...>
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_reorg_pax_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-COMMIT
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_reorg_pax_verify FROM '/tmp/copy_reorg_pax_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_reorg_pax_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_reorg_pax_verify;
-DROP
-DROP TABLE copy_reorg_pax_test;
-DROP
-
--- ============================================================
--- Test 2.2c: PAX — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_pax_test (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_query_reorg_pax_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_query_reorg_pax_test;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_query_reorg_pax_test SET WITH (reorganize=true);
-ALTER
-
-2&: COPY (SELECT * FROM copy_query_reorg_pax_test) TO '/tmp/copy_query_reorg_pax_test.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY (SELECT%copy_query_reorg_pax_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_query_reorg_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_query_reorg_pax_verify FROM '/tmp/copy_query_reorg_pax_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_query_reorg_pax_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_query_reorg_pax_verify;
-DROP
-DROP TABLE copy_query_reorg_pax_test;
-DROP
-
--- ============================================================
--- Test 2.3c: PAX — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_pax (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE
-CREATE TABLE copy_part_child1_pax PARTITION OF copy_part_parent_pax FOR VALUES FROM (1) TO (501);
-CREATE
-CREATE TABLE copy_part_child2_pax PARTITION OF copy_part_parent_pax FOR VALUES FROM (501) TO (1001);
-CREATE
-INSERT INTO copy_part_parent_pax SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_part_parent_pax;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_part_child1_pax SET WITH (reorganize=true);
-ALTER
-
-2&: COPY copy_part_parent_pax TO '/tmp/copy_part_parent_pax.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_part_parent_pax%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_part_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_part_pax_verify FROM '/tmp/copy_part_parent_pax.csv';
-COPY 1000
-SELECT count(*) FROM copy_part_pax_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_part_pax_verify;
-DROP
-DROP TABLE copy_part_parent_pax;
-DROP
-
--- ============================================================
--- Test 2.4c: PAX — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.2c — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_pax_lookup (cat INT) DISTRIBUTED BY (cat);
-CREATE
-INSERT INTO copy_rls_pax_lookup SELECT i FROM generate_series(1, 2) i;
-INSERT 2
-
-CREATE TABLE copy_rls_pax_main (a INT, category INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_rls_pax_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-INSERT 1000
-
-ALTER TABLE copy_rls_pax_main ENABLE ROW LEVEL SECURITY;
-ALTER
-CREATE POLICY p_rls_pax ON copy_rls_pax_main USING (category IN (SELECT cat from copy_rls_pax_lookup));
-CREATE
-
-CREATE ROLE copy_rls_pax_testuser;
-CREATE
-GRANT pg_write_server_files TO copy_rls_pax_testuser;
-GRANT
-GRANT ALL ON copy_rls_pax_main TO copy_rls_pax_testuser;
-GRANT
-GRANT ALL ON copy_rls_pax_lookup TO copy_rls_pax_testuser;
-GRANT
-
-SELECT count(*) FROM copy_rls_pax_main;
- count 
--------
- 1000  
-(1 row)
-
-2: SET ROLE copy_rls_pax_testuser; COPY copy_rls_pax_main TO '/tmp/copy_rls_pax_main.csv';
-SET 400
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_rls_pax_lookup SET WITH (reorganize=true);
-ALTER
-
-2&: SET ROLE copy_rls_pax_testuser; COPY copy_rls_pax_main TO '/tmp/copy_rls_pax_main.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE '%COPY copy_rls_pax_main%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-SET 400
-
--- Reset session 2's role to avoid leaking to subsequent tests
-2: RESET ROLE;
-RESET
-
-RESET ROLE;
-RESET
-CREATE TABLE copy_rls_pax_verify (a INT, category INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_rls_pax_verify FROM '/tmp/copy_rls_pax_main.csv';
-COPY 400
-SELECT count(*) FROM copy_rls_pax_verify;
- count 
--------
- 400   
-(1 row)
-
-DROP TABLE copy_rls_pax_verify;
-DROP
-DROP POLICY p_rls_pax ON copy_rls_pax_main;
-DROP
-DROP TABLE copy_rls_pax_main;
-DROP
-DROP TABLE copy_rls_pax_lookup;
-DROP
-DROP ROLE copy_rls_pax_testuser;
-DROP
-
--- ============================================================
--- Test 2.5c: PAX — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_pax_src (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO ctas_reorg_pax_src SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM ctas_reorg_pax_src;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE ctas_reorg_pax_src SET WITH (reorganize=true);
-ALTER
-
-2&: CREATE TABLE ctas_reorg_pax_dst AS SELECT * FROM ctas_reorg_pax_src DISTRIBUTED BY (a);  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'CREATE TABLE ctas_reorg_pax_dst%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-CREATE 1000
-
-SELECT count(*) FROM ctas_reorg_pax_dst;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE ctas_reorg_pax_dst;
-DROP
-DROP TABLE ctas_reorg_pax_src;
-DROP
-
--- NOTE: Test 2.6c (PAX variant of change distribution key + query-based COPY TO)
--- removed for the same reason as test 2.6 (server crash, pre-existing bug).
diff --git a/contrib/pax_storage/src/test/isolation2/isolation2_schedule b/contrib/pax_storage/src/test/isolation2/isolation2_schedule
index fa163aa96b6..72fa06f5204 100644
--- a/contrib/pax_storage/src/test/isolation2/isolation2_schedule
+++ b/contrib/pax_storage/src/test/isolation2/isolation2_schedule
@@ -157,7 +157,6 @@ test: pax/vacuum_while_vacuum
 # test: uao/bad_buffer_on_temp_ao_row
 
 test: reorganize_after_ao_vacuum_skip_drop truncate_after_ao_vacuum_skip_drop mark_all_aoseg_await_drop
-test: pax/copy_to_concurrent_reorganize
 # below test(s) inject faults so each of them need to be in a separate group
 test: segwalrep/master_wal_switch
 
diff --git a/contrib/pax_storage/src/test/isolation2/sql/pax/copy_to_concurrent_reorganize.sql b/contrib/pax_storage/src/test/isolation2/sql/pax/copy_to_concurrent_reorganize.sql
deleted file mode 100644
index 05ef25852e9..00000000000
--- a/contrib/pax_storage/src/test/isolation2/sql/pax/copy_to_concurrent_reorganize.sql
+++ /dev/null
@@ -1,170 +0,0 @@
--- Test: PAX table — relation-based COPY TO concurrent with ALTER TABLE SET WITH (reorganize=true)
--- Issue: https://github.com/apache/cloudberry/issues/1545
--- Same as test 2.1 in the main isolation2 suite but for PAX storage.
-
-CREATE TABLE copy_reorg_pax_test (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO copy_reorg_pax_test SELECT i, i FROM generate_series(1, 1000) i;
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_pax_test;
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-1: ALTER TABLE copy_reorg_pax_test SET WITH (reorganize=true);
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_pax_test TO '/tmp/copy_reorg_pax_test.csv';
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_reorg_pax_test%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_reorg_pax_verify FROM '/tmp/copy_reorg_pax_test.csv';
-SELECT count(*) FROM copy_reorg_pax_verify;
-
--- Cleanup
-DROP TABLE copy_reorg_pax_verify;
-DROP TABLE copy_reorg_pax_test;
-
--- ============================================================
--- Test 2.2c: PAX — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_pax_test (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO copy_query_reorg_pax_test SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_query_reorg_pax_test;
-
-1: BEGIN;
-1: ALTER TABLE copy_query_reorg_pax_test SET WITH (reorganize=true);
-
-2&: COPY (SELECT * FROM copy_query_reorg_pax_test) TO '/tmp/copy_query_reorg_pax_test.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY (SELECT%copy_query_reorg_pax_test%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_query_reorg_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_query_reorg_pax_verify FROM '/tmp/copy_query_reorg_pax_test.csv';
-SELECT count(*) FROM copy_query_reorg_pax_verify;
-
-DROP TABLE copy_query_reorg_pax_verify;
-DROP TABLE copy_query_reorg_pax_test;
-
--- ============================================================
--- Test 2.3c: PAX — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_pax (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE TABLE copy_part_child1_pax PARTITION OF copy_part_parent_pax FOR VALUES FROM (1) TO (501);
-CREATE TABLE copy_part_child2_pax PARTITION OF copy_part_parent_pax FOR VALUES FROM (501) TO (1001);
-INSERT INTO copy_part_parent_pax SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_part_parent_pax;
-
-1: BEGIN;
-1: ALTER TABLE copy_part_child1_pax SET WITH (reorganize=true);
-
-2&: COPY copy_part_parent_pax TO '/tmp/copy_part_parent_pax.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_part_parent_pax%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_part_pax_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_part_pax_verify FROM '/tmp/copy_part_parent_pax.csv';
-SELECT count(*) FROM copy_part_pax_verify;
-
-DROP TABLE copy_part_pax_verify;
-DROP TABLE copy_part_parent_pax;
-
--- ============================================================
--- Test 2.4c: PAX — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.2c — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_pax_lookup (cat INT) DISTRIBUTED BY (cat);
-INSERT INTO copy_rls_pax_lookup SELECT i FROM generate_series(1, 2) i;
-
-CREATE TABLE copy_rls_pax_main (a INT, category INT) DISTRIBUTED BY (a);
-INSERT INTO copy_rls_pax_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-
-ALTER TABLE copy_rls_pax_main ENABLE ROW LEVEL SECURITY;
-CREATE POLICY p_rls_pax ON copy_rls_pax_main USING (category IN (SELECT cat from copy_rls_pax_lookup));
-
-CREATE ROLE copy_rls_pax_testuser;
-GRANT pg_write_server_files TO copy_rls_pax_testuser;
-GRANT ALL ON copy_rls_pax_main TO copy_rls_pax_testuser;
-GRANT ALL ON copy_rls_pax_lookup TO copy_rls_pax_testuser;
-
-SELECT count(*) FROM copy_rls_pax_main;
-
-2: SET ROLE copy_rls_pax_testuser; COPY copy_rls_pax_main TO '/tmp/copy_rls_pax_main.csv';
-
-1: BEGIN;
-1: ALTER TABLE copy_rls_pax_lookup SET WITH (reorganize=true);
-
-2&: SET ROLE copy_rls_pax_testuser; COPY copy_rls_pax_main TO '/tmp/copy_rls_pax_main.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE '%COPY copy_rls_pax_main%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
--- Reset session 2's role to avoid leaking to subsequent tests
-2: RESET ROLE;
-
-RESET ROLE;
-CREATE TABLE copy_rls_pax_verify (a INT, category INT) DISTRIBUTED BY (a);
-COPY copy_rls_pax_verify FROM '/tmp/copy_rls_pax_main.csv';
-SELECT count(*) FROM copy_rls_pax_verify;
-
-DROP TABLE copy_rls_pax_verify;
-DROP POLICY p_rls_pax ON copy_rls_pax_main;
-DROP TABLE copy_rls_pax_main;
-DROP TABLE copy_rls_pax_lookup;
-DROP ROLE copy_rls_pax_testuser;
-
--- ============================================================
--- Test 2.5c: PAX — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_pax_src (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO ctas_reorg_pax_src SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM ctas_reorg_pax_src;
-
-1: BEGIN;
-1: ALTER TABLE ctas_reorg_pax_src SET WITH (reorganize=true);
-
-2&: CREATE TABLE ctas_reorg_pax_dst AS SELECT * FROM ctas_reorg_pax_src DISTRIBUTED BY (a);
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'CREATE TABLE ctas_reorg_pax_dst%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-SELECT count(*) FROM ctas_reorg_pax_dst;
-
-DROP TABLE ctas_reorg_pax_dst;
-DROP TABLE ctas_reorg_pax_src;
-
--- NOTE: Test 2.6c (PAX variant of change distribution key + query-based COPY TO)
--- removed for the same reason as test 2.6 (server crash, pre-existing bug).
diff --git a/contrib/pax_storage/src/test/regress/expected/groupingsets_optimizer.out b/contrib/pax_storage/src/test/regress/expected/groupingsets_optimizer.out
index b3da68b1f9d..382fb46fdfd 100644
--- a/contrib/pax_storage/src/test/regress/expected/groupingsets_optimizer.out
+++ b/contrib/pax_storage/src/test/regress/expected/groupingsets_optimizer.out
@@ -949,21 +949,21 @@ select v.c, (select count(*) from gstest2 group by () having v.c)
 explain (costs off)
   select v.c, (select count(*) from gstest2 group by () having v.c)
     from (values (false),(true)) v(c) order by v.c;
-                                QUERY PLAN                                
---------------------------------------------------------------------------
- Sort
-   Sort Key: "*VALUES*".column1
-   ->  Values Scan on "*VALUES*"
-         SubPlan 1
-           ->  Aggregate
-                 Group Key: ()
-                 Filter: "*VALUES*".column1
-                 ->  Result
-                       One-Time Filter: "*VALUES*".column1
-                       ->  Materialize
-                             ->  Gather Motion 3:1  (slice1; segments: 3)
+                             QUERY PLAN
+--------------------------------------------------------------------
+ Result
+   ->  Sort
+         Sort Key: "Values".column1
+         ->  Values Scan on "Values"
+   SubPlan 1
+     ->  Result
+           One-Time Filter: "Values".column1
+           ->  Finalize Aggregate
+                 ->  Materialize
+                       ->  Gather Motion 3:1  (slice1; segments: 3)
+                             ->  Partial Aggregate
                                    ->  Seq Scan on gstest2
- Optimizer: Postgres query optimizer
+ Optimizer: GPORCA
 (13 rows)
 
 -- HAVING with GROUPING queries
diff --git a/contrib/pax_storage/src/test/regress/expected/stats.out b/contrib/pax_storage/src/test/regress/expected/stats.out
index d3f407656fc..150dab3ead4 100644
--- a/contrib/pax_storage/src/test/regress/expected/stats.out
+++ b/contrib/pax_storage/src/test/regress/expected/stats.out
@@ -34,14 +34,13 @@ declare
   updated3 bool;
   updated4 bool;
   updated5 bool;
+  updated6 bool;
 begin
   -- we don't want to wait forever; loop will exit after 30 seconds
   for i in 1 .. 300 loop
 
-    -- With parallel query, the seqscan and indexscan on tenk2 might be done
-    -- in parallel worker processes, which will send their stats counters
-    -- asynchronously to what our own session does.  So we must check for
-    -- those counts to be registered separately from the update counts.
+    -- Segment stats are sent asynchronously to the coordinator, so we must
+    -- check for each counter independently to avoid false exits.
 
     -- check to see if seqscan has been sensed
     SELECT (st.seq_scan >= pr.seq_scan + 1) INTO updated1
@@ -68,7 +67,13 @@ begin
       FROM pg_stat_user_tables AS st, pg_class AS cl, prevstats AS pr
      WHERE st.relname='tenk2' AND cl.relname='tenk2';
 
-    exit when updated1 and updated2 and updated3 and updated4 and updated5;
+    -- check to see if seq_tup_read has been sensed; segment stats may arrive
+    -- after seq_scan count, so wait for this explicitly
+    SELECT (st.seq_tup_read >= pr.seq_tup_read + cl.reltuples) INTO updated6
+      FROM gp_stat_user_tables_summary AS st, pg_class AS cl, prevstats AS pr
+     WHERE st.relname='tenk2' AND cl.relname='tenk2';
+
+    exit when updated1 and updated2 and updated3 and updated4 and updated5 and updated6;
 
     -- wait a little
     perform pg_sleep_for('100 milliseconds');
diff --git a/contrib/pax_storage/src/test/regress/sql/stats.sql b/contrib/pax_storage/src/test/regress/sql/stats.sql
index 36878562f87..8f32a97cf18 100644
--- a/contrib/pax_storage/src/test/regress/sql/stats.sql
+++ b/contrib/pax_storage/src/test/regress/sql/stats.sql
@@ -33,14 +33,13 @@ declare
   updated3 bool;
   updated4 bool;
   updated5 bool;
+  updated6 bool;
 begin
   -- we don't want to wait forever; loop will exit after 30 seconds
   for i in 1 .. 300 loop
 
-    -- With parallel query, the seqscan and indexscan on tenk2 might be done
-    -- in parallel worker processes, which will send their stats counters
-    -- asynchronously to what our own session does.  So we must check for
-    -- those counts to be registered separately from the update counts.
+    -- Segment stats are sent asynchronously to the coordinator, so we must
+    -- check for each counter independently to avoid false exits.
 
     -- check to see if seqscan has been sensed
     SELECT (st.seq_scan >= pr.seq_scan + 1) INTO updated1
@@ -67,7 +66,13 @@ begin
       FROM pg_stat_user_tables AS st, pg_class AS cl, prevstats AS pr
      WHERE st.relname='tenk2' AND cl.relname='tenk2';
 
-    exit when updated1 and updated2 and updated3 and updated4 and updated5;
+    -- check to see if seq_tup_read has been sensed; segment stats may arrive
+    -- after seq_scan count, so wait for this explicitly
+    SELECT (st.seq_tup_read >= pr.seq_tup_read + cl.reltuples) INTO updated6
+      FROM gp_stat_user_tables_summary AS st, pg_class AS cl, prevstats AS pr
+     WHERE st.relname='tenk2' AND cl.relname='tenk2';
+
+    exit when updated1 and updated2 and updated3 and updated4 and updated5 and updated6;
 
     -- wait a little
     perform pg_sleep_for('100 milliseconds');
diff --git a/contrib/pg_trgm/expected/pg_trgm_optimizer.out b/contrib/pg_trgm/expected/pg_trgm_optimizer.out
index 4597b8ca047..a1e9b3d299d 100644
--- a/contrib/pg_trgm/expected/pg_trgm_optimizer.out
+++ b/contrib/pg_trgm/expected/pg_trgm_optimizer.out
@@ -2351,6 +2351,7 @@ select t <-> 'q0987wertyu0988', t from test_trgm order by t <-> 'q0987wertyu0988
          ->  Limit
                ->  Index Scan using trgm_idx on test_trgm
                      Order By: (t <-> 'q0987wertyu0988'::text)
+ Optimizer: Postgres query optimizer
 (7 rows)
 
 select t <-> 'q0987wertyu0988', t from test_trgm order by t <-> 'q0987wertyu0988' limit 2;
@@ -5003,8 +5004,8 @@ select * from test2 where t ~ '/\d+/-\d';
 -- test = operator
 explain (costs off)
   select * from test2 where t = 'abcdef';
-                QUERY PLAN                
-------------------------------------------
+                   QUERY PLAN                   
+------------------------------------------------
  Gather Motion 1:1  (slice1; segments: 1)
    ->  Bitmap Heap Scan on test2
          Recheck Cond: (t = 'abcdef'::text)
@@ -5020,8 +5021,8 @@ select * from test2 where t = 'abcdef';
 
 explain (costs off)
   select * from test2 where t = '%line%';
-                QUERY PLAN                
-------------------------------------------
+                   QUERY PLAN                   
+------------------------------------------------
  Gather Motion 1:1  (slice1; segments: 1)
    ->  Bitmap Heap Scan on test2
          Recheck Cond: (t = '%line%'::text)
@@ -5311,14 +5312,15 @@ select * from test2 where t ~ '/\d+/-\d';
 -- test = operator
 explain (costs off)
   select * from test2 where t = 'abcdef';
-                QUERY PLAN                
-------------------------------------------
+                   QUERY PLAN                    
+-------------------------------------------------
  Gather Motion 1:1  (slice1; segments: 1)
    ->  Bitmap Heap Scan on test2
          Recheck Cond: (t = 'abcdef'::text)
          ->  Bitmap Index Scan on test2_idx_gist
                Index Cond: (t = 'abcdef'::text)
-(2 rows)
+ Optimizer: Postgres query optimizer
+(6 rows)
 
 select * from test2 where t = 'abcdef';
    t    
@@ -5328,13 +5330,14 @@ select * from test2 where t = 'abcdef';
 
 explain (costs off)
   select * from test2 where t = '%line%';
-                QUERY PLAN                
-------------------------------------------
+                   QUERY PLAN                    
+-------------------------------------------------
  Gather Motion 1:1  (slice1; segments: 1)
    ->  Bitmap Heap Scan on test2
          Recheck Cond: (t = '%line%'::text)
          ->  Bitmap Index Scan on test2_idx_gist
                Index Cond: (t = '%line%'::text)
+ Optimizer: Postgres query optimizer
 (6 rows)
 
 select * from test2 where t = '%line%';
@@ -5423,7 +5426,7 @@ SELECT DISTINCT city, similarity(city, 'Warsaw'), show_limit()
                ->  Index Scan using restaurants_city_idx on restaurants
                      Index Cond: (city % 'Warsaw'::text)
                      Filter: (city % 'Warsaw'::text)
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (9 rows)
 
 SELECT set_limit(0.3);
diff --git a/contrib/postgres_fdw/expected/postgres_fdw.out b/contrib/postgres_fdw/expected/postgres_fdw.out
index 10700d6fd4a..9b70906a4a9 100644
--- a/contrib/postgres_fdw/expected/postgres_fdw.out
+++ b/contrib/postgres_fdw/expected/postgres_fdw.out
@@ -707,6 +707,17 @@ EXPLAIN (VERBOSE, COSTS OFF) SELECT * FROM ft_empty ORDER BY c1;
    Remote SQL: SELECT c1, c2 FROM public.loct_empty ORDER BY c1 ASC NULLS LAST
 (3 rows)
 
+-- test restriction on non-system foreign tables.
+SET restrict_nonsystem_relation_kind TO 'foreign-table';
+SELECT * from ft1 where c1 < 1; -- ERROR
+ERROR:  access to non-system foreign table is restricted
+INSERT INTO ft1 (c1) VALUES (1); -- ERROR
+ERROR:  access to non-system foreign table is restricted
+DELETE FROM ft1 WHERE c1 = 1; -- ERROR
+ERROR:  access to non-system foreign table is restricted
+TRUNCATE ft1; -- ERROR
+ERROR:  access to non-system foreign table is restricted
+RESET restrict_nonsystem_relation_kind;
 -- ===================================================================
 -- WHERE with remotely-executable conditions
 -- ===================================================================
diff --git a/contrib/postgres_fdw/sql/postgres_fdw.sql b/contrib/postgres_fdw/sql/postgres_fdw.sql
index 793dd64811d..ac290d3ba30 100644
--- a/contrib/postgres_fdw/sql/postgres_fdw.sql
+++ b/contrib/postgres_fdw/sql/postgres_fdw.sql
@@ -321,6 +321,14 @@ DELETE FROM loct_empty;
 ANALYZE ft_empty;
 EXPLAIN (VERBOSE, COSTS OFF) SELECT * FROM ft_empty ORDER BY c1;
 
+-- test restriction on non-system foreign tables.
+SET restrict_nonsystem_relation_kind TO 'foreign-table';
+SELECT * from ft1 where c1 < 1; -- ERROR
+INSERT INTO ft1 (c1) VALUES (1); -- ERROR
+DELETE FROM ft1 WHERE c1 = 1; -- ERROR
+TRUNCATE ft1; -- ERROR
+RESET restrict_nonsystem_relation_kind;
+
 -- ===================================================================
 -- WHERE with remotely-executable conditions
 -- ===================================================================
diff --git a/contrib/xml2/xpath.c b/contrib/xml2/xpath.c
index 1e5b71d9a02..0555294f234 100644
--- a/contrib/xml2/xpath.c
+++ b/contrib/xml2/xpath.c
@@ -74,8 +74,6 @@ pgxml_parser_init(PgXmlStrictness strictness)
 	/* Initialize libxml */
 	xmlInitParser();
 
-	xmlSubstituteEntitiesDefault(1);
-	xmlLoadExtDtdDefaultValue = 1;
 
 	return xmlerrcxt;
 }
@@ -425,8 +423,9 @@ pgxml_xpath(text *document, xmlChar *xpath, xpath_workspace *workspace)
 
 	PG_TRY();
 	{
-		workspace->doctree = xmlParseMemory((char *) VARDATA_ANY(document),
-											docsize);
+		workspace->doctree = xmlReadMemory((char *) VARDATA_ANY(document),
+										   docsize, NULL, NULL,
+										   XML_PARSE_NOENT);
 		if (workspace->doctree != NULL)
 		{
 			workspace->ctxt = xmlXPathNewContext(workspace->doctree);
@@ -719,7 +718,9 @@ xpath_table(PG_FUNCTION_ARGS)
 
 			/* Parse the document */
 			if (xmldoc)
-				doctree = xmlParseMemory(xmldoc, strlen(xmldoc));
+				doctree = xmlReadMemory(xmldoc, strlen(xmldoc),
+										NULL, NULL,
+										XML_PARSE_NOENT);
 			else				/* treat NULL as not well-formed */
 				doctree = NULL;
 
diff --git a/contrib/xml2/xslt_proc.c b/contrib/xml2/xslt_proc.c
index 2189bca86ff..f30a3a42c03 100644
--- a/contrib/xml2/xslt_proc.c
+++ b/contrib/xml2/xslt_proc.c
@@ -85,16 +85,18 @@ xslt_process(PG_FUNCTION_ARGS)
 		bool		xslt_sec_prefs_error;
 
 		/* Parse document */
-		doctree = xmlParseMemory((char *) VARDATA_ANY(doct),
-								 VARSIZE_ANY_EXHDR(doct));
+		doctree = xmlReadMemory((char *) VARDATA_ANY(doct),
+								VARSIZE_ANY_EXHDR(doct), NULL, NULL,
+								XML_PARSE_NOENT);
 
 		if (doctree == NULL)
 			xml_ereport(xmlerrcxt, ERROR, ERRCODE_EXTERNAL_ROUTINE_EXCEPTION,
 						"error parsing XML document");
 
 		/* Same for stylesheet */
-		ssdoc = xmlParseMemory((char *) VARDATA_ANY(ssheet),
-							   VARSIZE_ANY_EXHDR(ssheet));
+		ssdoc = xmlReadMemory((char *) VARDATA_ANY(ssheet),
+							  VARSIZE_ANY_EXHDR(ssheet), NULL, NULL,
+							  XML_PARSE_NOENT);
 
 		if (ssdoc == NULL)
 			xml_ereport(xmlerrcxt, ERROR, ERRCODE_EXTERNAL_ROUTINE_EXCEPTION,
diff --git a/devops/build/automation/cloudberry/scripts/build-cloudberry.sh b/devops/build/automation/cloudberry/scripts/build-cloudberry.sh
index efa061a0f83..ca4c73d55cb 100755
--- a/devops/build/automation/cloudberry/scripts/build-cloudberry.sh
+++ b/devops/build/automation/cloudberry/scripts/build-cloudberry.sh
@@ -71,7 +71,7 @@ init_environment "Cloudberry Build Script" "${BUILD_LOG}"
 
 # Set environment
 log_section "Environment Setup"
-export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:LD_LIBRARY_PATH
+export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:${LD_LIBRARY_PATH:-""}
 log_section_end "Environment Setup"
 
 # Build process
diff --git a/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh b/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh
index 32a9f3d8657..cc9e7376239 100755
--- a/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh
+++ b/devops/build/automation/cloudberry/scripts/configure-cloudberry.sh
@@ -121,7 +121,7 @@ log_section "Initial Setup"
 execute_cmd sudo rm -rf ${BUILD_DESTINATION} || exit 2
 execute_cmd sudo chmod a+w /usr/local || exit 2
 execute_cmd sudo mkdir -p ${BUILD_DESTINATION}/lib || exit 2
-if [[ "$OS_ID" == "rocky" && "$OS_VERSION" =~ ^(8|9) ]]; then
+if [[ "$OS_ID" == "rocky" && "$OS_VERSION" =~ ^(8|9|10) ]]; then
     execute_cmd sudo cp /usr/local/xerces-c/lib/libxerces-c.so \
                 /usr/local/xerces-c/lib/libxerces-c-3.3.so \
                 ${BUILD_DESTINATION}/lib || exit 3
@@ -131,7 +131,7 @@ log_section_end "Initial Setup"
 
 # Set environment
 log_section "Environment Setup"
-export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:LD_LIBRARY_PATH
+export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:${LD_LIBRARY_PATH:-""}
 log_section_end "Environment Setup"
 
 # Add debug options if ENABLE_DEBUG is set to "true"
@@ -162,6 +162,8 @@ execute_cmd ./configure --prefix=${BUILD_DESTINATION} \
             --disable-pxf \
             --enable-tap-tests \
             ${CONFIGURE_DEBUG_OPTS} \
+            --with-diskquota \
+            --with-gp-stats-collector \
             --with-gssapi \
             --with-ldap \
             --with-libxml \
diff --git a/devops/build/automation/cloudberry/scripts/parse-results.pl b/devops/build/automation/cloudberry/scripts/parse-results.pl
index d09085d5fb9..2c754bcae9d 100755
--- a/devops/build/automation/cloudberry/scripts/parse-results.pl
+++ b/devops/build/automation/cloudberry/scripts/parse-results.pl
@@ -110,7 +110,7 @@
 my @ignored_test_list = ();
 
 while (<$fh>) {
-    # Match the summary lines
+    # Match the summary lines (pg_regress format)
     if (/All (\d+) tests passed\./) {
         $status = 'passed';
         $total_tests = $1;
@@ -132,8 +132,24 @@
         $status = 'failed';
         $failed_tests = $1 - $3;
         $ignored_tests = $3;
         $total_tests = $2;
         $passed_tests = $2 - $1;
+
+    # TAP/prove summary format: "Files=N, Tests=N, ..."
+    } elsif (/^Files=\d+, Tests=(\d+),/) {
+        $total_tests = $1;
+
+    # TAP/prove result: "Result: PASS" or "Result: FAIL"
+    } elsif (/^Result: PASS/) {
+        $status = 'passed';
+        $passed_tests = $total_tests;
+        $failed_tests = 0;
+    } elsif (/^Result: FAIL/) {
+        $status = 'failed';
+
+    # TAP individual test failure: "  t/xxx.pl (Wstat: ...)"
+    } elsif (/^\s+(t\/\S+\.pl)\s+\(Wstat:/) {
+        push @failed_test_list, $1;
     }
 
     # Capture failed tests
@@ -150,8 +166,15 @@
 # Close the log file
 close $fh;
 
-# Validate failed test count matches found test names
-if ($status eq 'failed' && scalar(@failed_test_list) != $failed_tests) {
+# For TAP format, derive failed/passed counts from collected test names
+if ($status eq 'failed' && $failed_tests == 0 && scalar(@failed_test_list) > 0) {
+    $failed_tests = scalar(@failed_test_list);
+    $passed_tests = $total_tests - $failed_tests if $total_tests > 0;
+}
+
+# Validate failed test count matches found test names (pg_regress format only)
+if ($status eq 'failed' && $failed_tests > 0 && scalar(@failed_test_list) > 0
+    && scalar(@failed_test_list) != $failed_tests) {
     print "Error: Found $failed_tests failed tests in summary but found " . scalar(@failed_test_list) . " failed test names\n";
     print "Failed test names found:\n";
     foreach my $test (@failed_test_list) {
diff --git a/devops/build/automation/cloudberry/scripts/unittest-cloudberry.sh b/devops/build/automation/cloudberry/scripts/unittest-cloudberry.sh
index 97107ea1a9f..69536f0067f 100755
--- a/devops/build/automation/cloudberry/scripts/unittest-cloudberry.sh
+++ b/devops/build/automation/cloudberry/scripts/unittest-cloudberry.sh
@@ -56,7 +56,7 @@ init_environment "Cloudberry Unittest Script" "${UNITTEST_LOG}"
 
 # Set environment
 log_section "Environment Setup"
-export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:LD_LIBRARY_PATH
+export LD_LIBRARY_PATH=${BUILD_DESTINATION}/lib:${LD_LIBRARY_PATH:-""}
 log_section_end "Environment Setup"
 
 # Unittest process
diff --git a/devops/build/packaging/deb/build-deb.sh b/devops/build/packaging/deb/build-deb.sh
index 1f5aef2258a..61a29e50fc9 100755
--- a/devops/build/packaging/deb/build-deb.sh
+++ b/devops/build/packaging/deb/build-deb.sh
@@ -109,7 +109,7 @@ export CBDB_FULL_VERSION=$VERSION
 
 # Set version if not provided
 if [ -z "${VERSION}" ]; then
-  export CBDB_FULL_VERSION=$(./getversion | cut -d'-' -f 1 | cut -d'+' -f 1)
+  export CBDB_FULL_VERSION=$(./getversion 2>/dev/null | cut -d'-' -f 1 | cut -d'+' -f 1 || echo "unknown")
 fi
 
 if [[ ! $CBDB_FULL_VERSION =~ ^[0-9] ]]; then
@@ -127,22 +127,48 @@ fi
 # Detect OS distribution (e.g., ubuntu22.04, debian12)
 if [ -z ${OS_DISTRO+x} ]; then
   if [ -f /etc/os-release ]; then
+    # Temporarily disable unbound variable check for sourcing os-release
+    set +u
     . /etc/os-release
-    OS_DISTRO=$(echo "${ID}${VERSION_ID}" | tr '[:upper:]' '[:lower:]')
+    set -u
+    # Ensure ID and VERSION_ID are set before using them
+    OS_DISTRO=$(echo "${ID:-unknown}${VERSION_ID:-}" | tr '[:upper:]' '[:lower:]')
   else
     OS_DISTRO="unknown"
   fi
 fi
 
+# Ensure OS_DISTRO is exported and not empty
+export OS_DISTRO=${OS_DISTRO:-unknown}
+
 export CBDB_PKG_VERSION=${CBDB_FULL_VERSION}-${BUILD_NUMBER}-${OS_DISTRO}
 
 # Check if required commands are available
 check_commands
 
-# Define the control file path
-CONTROL_FILE=debian/control
+# Find project root (assumed to be four levels up from scripts directory: devops/build/packaging/deb/)
+PROJECT_ROOT="$(cd "$(dirname "$0")/../../../../" && pwd)"
+
+# Define where the debian metadata is located
+DEBIAN_SRC_DIR="$(dirname "$0")/${OS_DISTRO}"
+
+# Prepare the debian directory at the project root (required by dpkg-buildpackage)
+if [ -d "$DEBIAN_SRC_DIR" ]; then
+    echo "Preparing debian directory from $DEBIAN_SRC_DIR..."
+    mkdir -p "$PROJECT_ROOT/debian"
+    # The trailing "/." copies the directory's contents into the existing target rather than nesting the directory inside it
+    cp -rf "$DEBIAN_SRC_DIR"/. "$PROJECT_ROOT/debian/"
+else
+    if [ ! -d "$PROJECT_ROOT/debian" ]; then
+        echo "Error: Debian metadata not found at $DEBIAN_SRC_DIR and no debian/ directory exists at root."
+        exit 1
+    fi
+fi
+
+# Define the control file path (at the project root)
+CONTROL_FILE="$PROJECT_ROOT/debian/control"
 
-# Check if the spec file exists
+# Check if the control file exists
 if [ ! -f "$CONTROL_FILE" ]; then
   echo "Error: Control file not found at $CONTROL_FILE."
   exit 1
@@ -160,10 +186,15 @@ if [ "${DRY_RUN:-false}" = true ]; then
   exit 0
 fi
 
-# Run debbuild with the provided options
-echo "Building DEB with Version $CBDB_FULL_VERSION ..."
+# Run debbuild from the project root
+echo "Building DEB with Version $CBDB_FULL_VERSION in $PROJECT_ROOT ..."
+
+print_changelog > "$PROJECT_ROOT/debian/changelog"
 
-print_changelog > debian/changelog
+# Only cd if we are not already at the project root
+if [ "$(pwd)" != "$PROJECT_ROOT" ]; then
+    cd "$PROJECT_ROOT"
+fi
 
 if ! eval "$DEBBUILD_CMD"; then
   echo "Error: deb build failed."
diff --git a/devops/build/packaging/deb/ubuntu22.04/control b/devops/build/packaging/deb/ubuntu22.04/control
index 4bc5d90b84d..6b05863b780 100644
--- a/devops/build/packaging/deb/ubuntu22.04/control
+++ b/devops/build/packaging/deb/ubuntu22.04/control
@@ -46,6 +46,8 @@ Provides: apache-cloudberry-db
 Architecture: any
 Depends: curl,
     cgroup-tools,
+    debianutils,
+    hostname,
     iputils-ping,
     iproute2,
     keyutils,
diff --git a/devops/build/packaging/deb/ubuntu22.04/rules b/devops/build/packaging/deb/ubuntu22.04/rules
index cb387d209e6..463486cf03f 100755
--- a/devops/build/packaging/deb/ubuntu22.04/rules
+++ b/devops/build/packaging/deb/ubuntu22.04/rules
@@ -19,7 +19,22 @@ include /usr/share/dpkg/default.mk
 	dh $@ --parallel
 
 gpinstall:
-	make install DESTDIR=${DEBIAN_DESTINATION} prefix=
+	# If the build staging directory is empty, copy from the pre-installed location.
+	# In CI, BUILD_DESTINATION already points here so it will be populated.
+	# For local manual packaging, copy from the installed Cloudberry path.
+	@mkdir -p ${DEBIAN_DESTINATION}
+	@if [ -z "$$(ls -A ${DEBIAN_DESTINATION} 2>/dev/null)" ]; then \
+		echo "Copying pre-built binaries from ${CBDB_BIN_PATH} to ${DEBIAN_DESTINATION}..."; \
+		cp -a ${CBDB_BIN_PATH}/* ${DEBIAN_DESTINATION}/; \
+	else \
+		echo "Build staging directory already populated, skipping copy."; \
+	fi
+	# Copy Apache compliance files into the build staging directory
+	cp -a LICENSE NOTICE DISCLAIMER ${DEBIAN_DESTINATION}/
+	cp -a licenses ${DEBIAN_DESTINATION}/
+	# Create debian/copyright for Debian policy compliance
+	mkdir -p $(shell pwd)/debian
+	cat LICENSE NOTICE > $(shell pwd)/debian/copyright
 
 override_dh_auto_install: gpinstall
 	# the staging directory for creating a debian is NOT the right GPHOME.
diff --git a/devops/build/packaging/deb/ubuntu24.04/control b/devops/build/packaging/deb/ubuntu24.04/control
index a561d8a4386..9e2c3eab451 100644
--- a/devops/build/packaging/deb/ubuntu24.04/control
+++ b/devops/build/packaging/deb/ubuntu24.04/control
@@ -46,6 +46,8 @@ Provides: apache-cloudberry-db
 Architecture: amd64
 Depends: curl,
     cgroup-tools,
+    debianutils,
+    hostname,
     iputils-ping,
     iproute2,
     keyutils,
diff --git a/devops/build/packaging/rpm/apache-cloudberry-db-incubating.spec b/devops/build/packaging/rpm/apache-cloudberry-db-incubating.spec
index 03fa0a34570..e228f8fe76a 100644
--- a/devops/build/packaging/rpm/apache-cloudberry-db-incubating.spec
+++ b/devops/build/packaging/rpm/apache-cloudberry-db-incubating.spec
@@ -52,12 +52,15 @@ Prefix:         %{cloudberry_install_dir}
 # List runtime dependencies
 
 Requires:       bash
+Requires:       hostname
 Requires:       iproute
 Requires:       iputils
+Requires:       less
 Requires:       openssh
 Requires:       openssh-clients
 Requires:       openssh-server
 Requires:       rsync
+Requires:       which
 
 %if 0%{?rhel} == 8
 Requires:       apr
@@ -152,6 +155,12 @@ mkdir -p %{buildroot}%{cloudberry_install_dir}-%{version}
 
 cp -R %{cloudberry_install_dir}/* %{buildroot}%{cloudberry_install_dir}-%{version}
 
+# Copy Apache mandatory compliance files from the SOURCES directory into the installation directory
+cp %{_sourcedir}/LICENSE %{buildroot}%{cloudberry_install_dir}-%{version}/
+cp %{_sourcedir}/NOTICE %{buildroot}%{cloudberry_install_dir}-%{version}/
+cp %{_sourcedir}/DISCLAIMER %{buildroot}%{cloudberry_install_dir}-%{version}/
+cp -R %{_sourcedir}/licenses %{buildroot}%{cloudberry_install_dir}-%{version}/
+
 # Create the symbolic link
 ln -sfn %{cloudberry_install_dir}-%{version} %{buildroot}%{cloudberry_install_dir}
 
@@ -159,8 +168,6 @@ ln -sfn %{cloudberry_install_dir}-%{version} %{buildroot}%{cloudberry_install_di
 %{prefix}-%{version}
 %{prefix}
 
-%license %{cloudberry_install_dir}-%{version}/LICENSE
-
 %debug_package
 
 %post
diff --git a/devops/build/packaging/rpm/build-rpm.sh b/devops/build/packaging/rpm/build-rpm.sh
index ceb7d18d392..2c490166f45 100755
--- a/devops/build/packaging/rpm/build-rpm.sh
+++ b/devops/build/packaging/rpm/build-rpm.sh
@@ -118,10 +118,46 @@ fi
 # Check if required commands are available
 check_commands
 
-# Define the spec file path
+# Define the source spec file path (assuming it is in the same directory as the script)
+SOURCE_SPEC_FILE="$(dirname "$0")/apache-cloudberry-db-incubating.spec"
+
+# Ensure rpmbuild SPECS and SOURCES directories exist
+mkdir -p ~/rpmbuild/SPECS
+mkdir -p ~/rpmbuild/SOURCES
+
+# Find project root (assumed to be four levels up from scripts directory: devops/build/packaging/rpm/)
+PROJECT_ROOT="$(cd "$(dirname "$0")/../../../../" && pwd)"
+
+# Define the target spec file path
 SPEC_FILE=~/rpmbuild/SPECS/apache-cloudberry-db-incubating.spec
 
-# Check if the spec file exists
+# Copy the spec file to rpmbuild/SPECS if the source exists and is different
+if [ -f "$SOURCE_SPEC_FILE" ]; then
+  # Avoid copying if SPEC_FILE is already a symlink/file pointing to SOURCE_SPEC_FILE (common in CI)
+  if [ ! "$SOURCE_SPEC_FILE" -ef "$SPEC_FILE" ]; then
+    cp -f "$SOURCE_SPEC_FILE" "$SPEC_FILE"
+  fi
+else
+  echo "Warning: Source spec file not found at $SOURCE_SPEC_FILE, assuming it is already in ~/rpmbuild/SPECS/"
+fi
+
+# Copy Apache mandatory compliance files to rpmbuild/SOURCES
+echo "Copying compliance files from $PROJECT_ROOT to ~/rpmbuild/SOURCES..."
+for f in LICENSE NOTICE DISCLAIMER; do
+    if [ -f "$PROJECT_ROOT/$f" ]; then
+        cp -af "$PROJECT_ROOT/$f" ~/rpmbuild/SOURCES/
+    else
+        echo "Warning: $f not found in $PROJECT_ROOT"
+    fi
+done
+
+if [ -d "$PROJECT_ROOT/licenses" ]; then
+    cp -af "$PROJECT_ROOT/licenses" ~/rpmbuild/SOURCES/
+else
+    echo "Warning: licenses directory not found in $PROJECT_ROOT"
+fi
+
+# Check if the spec file exists at the target location before proceeding
 if [ ! -f "$SPEC_FILE" ]; then
   echo "Error: Spec file not found at $SPEC_FILE."
   exit 1
diff --git a/devops/deploy/docker/build/rocky10/Dockerfile b/devops/deploy/docker/build/rocky10/Dockerfile
new file mode 100644
index 00000000000..3ab40229020
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/Dockerfile
@@ -0,0 +1,217 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+#
+# Apache Cloudberry (Incubating) is an effort undergoing incubation at
+# the Apache Software Foundation (ASF), sponsored by the Apache
+# Incubator PMC.
+#
+# Incubation is required of all newly accepted projects until a
+# further review indicates that the infrastructure, communications,
+# and decision making process have stabilized in a manner consistent
+# with other successful ASF projects.
+#
+# While incubation status is not necessarily a reflection of the
+# completeness or stability of the code, it does indicate that the
+# project has yet to be fully endorsed by the ASF.
+#
+# --------------------------------------------------------------------
+# Dockerfile for Apache Cloudberry Build Environment
+# --------------------------------------------------------------------
+# This Dockerfile sets up a Rocky Linux 10-based container for building
+# and developing Apache Cloudberry. It installs necessary system
+# utilities, development tools, and configures the environment for SSH
+# access and systemd support.
+#
+# Key Features:
+# - Locale setup for en_US.UTF-8
+# - SSH daemon setup for remote access
+# - Essential development tools and libraries installation
+# - User configuration for 'gpadmin' with sudo privileges
+#
+# Usage:
+#   docker build -t cloudberry-db-env .
+#   docker run -h cdw -it cloudberry-db-env
+# --------------------------------------------------------------------
+
+# Base image: Rocky Linux 10
+FROM rockylinux/rockylinux:10
+
+# Argument for configuring the timezone
+ARG TIMEZONE_VAR="America/Los_Angeles"
+
+# Environment variables for locale and user
+ENV container=docker
+ENV LANG=en_US.UTF-8
+ENV USER=gpadmin
+
+# --------------------------------------------------------------------
+# Install Development Tools and Utilities
+# --------------------------------------------------------------------
+# Install various development tools, system utilities, and libraries
+# required for building and running Apache Cloudberry.
+# - EPEL repository is enabled for additional packages.
+# - Cleanup steps are added to reduce image size after installation.
+# --------------------------------------------------------------------
+RUN dnf makecache && \
+    dnf install -y \
+        epel-release \
+        git && \
+    dnf makecache && \
+    dnf config-manager --disable epel && \
+    dnf install -y --enablerepo=epel \
+        bat \
+        libssh2-devel \
+        python3-devel \
+        htop && \
+    dnf install -y \
+        bison \
+        cmake3 \
+        ed \
+        file \
+        flex \
+        gcc \
+        gcc-c++ \
+        gdb \
+        glibc-langpack-en \
+        glibc-locale-source \
+        initscripts \
+        iproute \
+        less \
+        lsof \
+        m4 \
+        net-tools \
+        openssh-clients \
+        openssh-server \
+        perl \
+        rpm-build \
+        rpmdevtools \
+        rsync \
+        sudo \
+        tar \
+        unzip \
+        util-linux-ng \
+        wget \
+        sshpass \
+        which && \
+    dnf install -y \
+        apr-devel \
+        bzip2-devel \
+        java-21-openjdk \
+        java-21-openjdk-devel \
+        krb5-devel \
+        libcurl-devel \
+        libevent-devel \
+        libicu-devel \
+        libxml2-devel \
+        libuuid-devel \
+        libzstd-devel \
+        lz4 \
+        lz4-devel \
+        openldap-devel \
+        openssl-devel \
+        pam-devel \
+        perl-ExtUtils-Embed \
+        perl-Test-Simple \
+        perl-core \
+        python3-setuptools \
+        readline-devel \
+        zlib-devel && \
+    dnf install -y --enablerepo=crb \
+        liburing-devel \
+        libuv-devel \
+        libyaml-devel \
+        perl-IPC-Run \
+        python3-wheel \
+        protobuf-devel && \
+    dnf clean all && \
+    cd && XERCES_LATEST_RELEASE=3.3.0 && \
+    wget -nv "https://archive.apache.org/dist/xerces/c/3/sources/xerces-c-${XERCES_LATEST_RELEASE}.tar.gz" && \
+    echo "$(curl -sL https://archive.apache.org/dist/xerces/c/3/sources/xerces-c-${XERCES_LATEST_RELEASE}.tar.gz.sha256)" | sha256sum -c - && \
+    tar xf "xerces-c-${XERCES_LATEST_RELEASE}.tar.gz" && rm "xerces-c-${XERCES_LATEST_RELEASE}.tar.gz" && \
+    cd xerces-c-${XERCES_LATEST_RELEASE} && \
+    ./configure --prefix=/usr/local/xerces-c && \
+    make -j$(nproc) && \
+    make install -C ~/xerces-c-${XERCES_LATEST_RELEASE} && \
+    rm -rf ~/xerces-c* && \
+    cd && GO_VERSION="go1.25.10" && \
+    ARCH=$(uname -m) && \
+    if [ "${ARCH}" = "aarch64" ]; then \
+        GO_ARCH="arm64" && \
+        GO_SHA256="654da1f9b50a5d1c2a85ccf8ed405aa89c06e94d18384628bf186f7712677b08"; \
+    elif [ "${ARCH}" = "x86_64" ]; then \
+        GO_ARCH="amd64" && \
+        GO_SHA256="42d4f7a32316aa66591eca7e89867256057a4264451aca10570a715b3637ba70"; \
+    else \
+        echo "Unsupported architecture: ${ARCH}" && exit 1; \
+    fi && \
+    GO_URL="https://go.dev/dl/${GO_VERSION}.linux-${GO_ARCH}.tar.gz" && \
+    wget -nv "${GO_URL}" && \
+    echo "${GO_SHA256}  ${GO_VERSION}.linux-${GO_ARCH}.tar.gz" | sha256sum -c - && \
+    tar xf "${GO_VERSION}.linux-${GO_ARCH}.tar.gz" && \
+    mv go "/usr/local/${GO_VERSION}" && \
+    ln -s "/usr/local/${GO_VERSION}" /usr/local/go && \
+    rm -f "${GO_VERSION}.linux-${GO_ARCH}.tar.gz" && \
+    echo 'export PATH=$PATH:/usr/local/go/bin' | tee -a /etc/profile.d/go.sh > /dev/null
+
+# --------------------------------------------------------------------
+# Copy Configuration Files and Setup the Environment
+# --------------------------------------------------------------------
+# - Copy custom configuration files from the build context to /tmp/.
+# - Apply custom system limits and timezone.
+# - Create and configure the 'gpadmin' user with sudo privileges.
+# - Set up SSH for password-based authentication.
+# - Generate locale and set the default locale to en_US.UTF-8.
+# --------------------------------------------------------------------
+
+# Copy configuration files from their respective locations
+COPY ./configs/* /tmp/
+
+RUN cp /tmp/90-cbdb-limits /etc/security/limits.d/90-cbdb-limits && \
+    sed -i.bak -r 's/^(session\s+required\s+pam_limits.so)/#\1/' /etc/pam.d/* && \
+    cat /usr/share/zoneinfo/${TIMEZONE_VAR} > /etc/localtime && \
+    chmod 777 /tmp/init_system.sh && \
+    /usr/sbin/groupadd gpadmin && \
+    /usr/sbin/useradd gpadmin -g gpadmin -G wheel && \
+    setcap cap_net_raw+ep /usr/bin/ping && \
+    echo 'gpadmin ALL=(ALL) NOPASSWD: ALL' > /etc/sudoers.d/90-gpadmin && \
+    echo -e '\n# Add Cloudberry entries\nif [ -f /usr/local/cbdb/cloudberry-env.sh ]; then\n  source /usr/local/cbdb/cloudberry-env.sh\nfi' >> /home/gpadmin/.bashrc && \
+    ssh-keygen -A && \
+    echo "PasswordAuthentication yes" >> /etc/ssh/sshd_config && \
+    localedef -i en_US -f UTF-8 en_US.UTF-8 && \
+    echo "LANG=en_US.UTF-8" | tee /etc/locale.conf && \
+    dnf clean all  # Final cleanup to remove unnecessary files
+
+# Install testinfra via pip
+RUN pip3 install pytest-testinfra
+
+# Copying test files into the container
+COPY ./tests /tests
+
+# --------------------------------------------------------------------
+# Set the Default User and Command
+# --------------------------------------------------------------------
+# The default user is set to 'gpadmin', and the container starts by
+# running the init_system.sh script. The container also mounts the
+# /sys/fs/cgroup volume for systemd compatibility.
+# --------------------------------------------------------------------
+USER gpadmin
+
+VOLUME [ "/sys/fs/cgroup" ]
+CMD ["bash","-c","/tmp/init_system.sh"]
diff --git a/devops/deploy/docker/build/rocky10/configs/90-cbdb-limits b/devops/deploy/docker/build/rocky10/configs/90-cbdb-limits
new file mode 100644
index 00000000000..474957c42f6
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/configs/90-cbdb-limits
@@ -0,0 +1,32 @@
+# /etc/security/limits.d/90-cbdb-limits
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+
+# Core dump file size limits for gpadmin
+gpadmin soft core unlimited
+gpadmin hard core unlimited
+
+# Open file limits for gpadmin
+gpadmin soft nofile 524288
+gpadmin hard nofile 524288
+
+# Process limits for gpadmin
+gpadmin soft nproc 131072
+gpadmin hard nproc 131072
diff --git a/devops/deploy/docker/build/rocky10/configs/gpinitsystem.conf b/devops/deploy/docker/build/rocky10/configs/gpinitsystem.conf
new file mode 100644
index 00000000000..d4d312231c5
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/configs/gpinitsystem.conf
@@ -0,0 +1,89 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+
+# --------------------------------------------------------------------
+# gpinitsystem Configuration File for Apache Cloudberry
+# --------------------------------------------------------------------
+# This configuration file is used to initialize an Apache Cloudberry
+# cluster. It defines the settings for the coordinator, primary segments,
+# and mirrors, as well as other important configuration options.
+# --------------------------------------------------------------------
+
+# Segment prefix - This prefix is used for naming the segment directories.
+# For example, the primary segment directories will be named gpseg0, gpseg1, etc.
+SEG_PREFIX=gpseg
+
+# Coordinator port - The port number where the coordinator will listen.
+# This is the port used by clients to connect to the database.
+COORDINATOR_PORT=5432
+
+# Coordinator hostname - The hostname of the machine where the coordinator
+# will be running. The $(hostname) command will automatically insert the
+# hostname of the current machine.
+COORDINATOR_HOSTNAME=$(hostname)
+
+# Coordinator data directory - The directory where the coordinator's data
+# will be stored. This directory should have enough space to store metadata
+# and system catalogs.
+COORDINATOR_DIRECTORY=/data1/coordinator
+
+# Base port for primary segments - The starting port number for the primary
+# segments. Each primary segment will use a unique port number starting from
+# this base.
+PORT_BASE=6000
+
+# Primary segment data directories - An array specifying the directories where
+# the primary segment data will be stored. Each directory corresponds to a
+# primary segment. In this case, two primary segments will be created in the
+# same directory.
+declare -a DATA_DIRECTORY=(/data1/primary /data1/primary)
+
+# Base port for mirror segments - The starting port number for the mirror
+# segments. Each mirror segment will use a unique port number starting from
+# this base.
+MIRROR_PORT_BASE=7000
+
+# Mirror segment data directories - An array specifying the directories where
+# the mirror segment data will be stored. Each directory corresponds to a
+# mirror segment. In this case, two mirror segments will be created in the
+# same directory.
+declare -a MIRROR_DATA_DIRECTORY=(/data1/mirror /data1/mirror)
+
+# Trusted shell - The shell program used for remote execution. Cloudberry uses
+# SSH to run commands on other machines in the cluster. 'ssh' is the default.
+TRUSTED_SHELL=ssh
+
+# Database encoding - The character set encoding to be used by the database.
+# 'UNICODE' is a common choice, especially for internationalization.
+ENCODING=UNICODE
+
+# Default database name - The name of the default database to be created during
+# initialization. This is also the default database that the gpadmin user will
+# connect to.
+DATABASE_NAME=gpadmin
+
+# Machine list file - A file containing the list of hostnames where the primary
+# segments will be created. Each line in the file represents a different machine.
+# This file is critical for setting up the cluster across multiple nodes.
+MACHINE_LIST_FILE=/home/gpadmin/hostfile_gpinitsystem
+
+# --------------------------------------------------------------------
+# End of gpinitsystem Configuration File
+# --------------------------------------------------------------------
diff --git a/devops/deploy/docker/build/rocky10/configs/init_system.sh b/devops/deploy/docker/build/rocky10/configs/init_system.sh
new file mode 100755
index 00000000000..d8c4a00b035
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/configs/init_system.sh
@@ -0,0 +1,192 @@
+#!/bin/bash
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+## Container Initialization Script
+# --------------------------------------------------------------------
+## This script sets up the environment inside the Docker container for
+## the Apache Cloudberry Build Environment. It performs the following
+## tasks:
+##
+## 1. Verifies that the container is running with the expected hostname.
+## 2. Starts the SSH daemon to allow SSH access to the container.
+## 3. Configures passwordless SSH access for the 'gpadmin' user.
+## 4. Displays a welcome banner and system information.
+## 5. Starts an interactive bash shell.
+##
+## This script is intended to be used as an entrypoint or initialization
+## script for the Docker container.
+# --------------------------------------------------------------------
+
+# --------------------------------------------------------------------
+# Check if the hostname is 'cdw'
+# --------------------------------------------------------------------
+# The script checks if the container's hostname is set to 'cdw'. This is
+# a requirement for this environment, and if the hostname does not match,
+# the script will exit with an error message. This ensures consistency
+# across different environments.
+# --------------------------------------------------------------------
+if [ "$(hostname)" != "cdw" ]; then
+    echo "Error: This container must be run with the hostname 'cdw'."
+    echo "Use the following command: docker run -h cdw ..."
+    exit 1
+fi
+
+# --------------------------------------------------------------------
+# Start SSH daemon and setup for SSH access
+# --------------------------------------------------------------------
+# The SSH daemon is started to allow remote access to the container via
+# SSH. This is useful for development and debugging purposes. If the SSH
+# daemon fails to start, the script exits with an error.
+# --------------------------------------------------------------------
+if ! sudo /usr/sbin/sshd; then
+    echo "Failed to start SSH daemon" >&2
+    exit 1
+fi
+
+# --------------------------------------------------------------------
+# Remove /run/nologin to allow logins
+# --------------------------------------------------------------------
+# The /run/nologin file, if present, prevents users from logging into
+# the system. This file is removed to ensure that users can log in via SSH.
+# --------------------------------------------------------------------
+sudo rm -rf /run/nologin
+
+# --------------------------------------------------------------------
+# Configure passwordless SSH access for 'gpadmin' user
+# --------------------------------------------------------------------
+# The script sets up SSH key-based authentication for the 'gpadmin' user,
+# allowing passwordless SSH access. It generates a new SSH key pair if one
+# does not already exist, and configures the necessary permissions.
+# --------------------------------------------------------------------
+ssh_dir=/home/gpadmin/.ssh
+mkdir -p "$ssh_dir"
+chmod 700 "$ssh_dir"
+if [ ! -f "$ssh_dir/id_rsa" ]; then
+    ssh-keygen -t rsa -b 4096 -C gpadmin -f "$ssh_dir/id_rsa" -P "" > /dev/null 2>&1
+fi
+
+# Authorize the key only once so container restarts do not append duplicates.
+grep -qxFf "$ssh_dir/id_rsa.pub" "$ssh_dir/authorized_keys" 2>/dev/null ||
+    cat "$ssh_dir/id_rsa.pub" >> "$ssh_dir/authorized_keys"
+chmod 600 "$ssh_dir/authorized_keys"
+# Add the container's hostname to the known_hosts file to avoid SSH warnings
+ssh-keyscan -t rsa cdw > "$ssh_dir/known_hosts" 2>/dev/null
+# Change to the home directory of the current user
+cd "$HOME"
+
+# --------------------------------------------------------------------
+# Display a Welcome Banner
+# --------------------------------------------------------------------
+# The following ASCII art and welcome message are displayed when the
+# container starts. This banner provides a visual indication that the
+# container is running in the Apache Cloudberry Build Environment.
+# --------------------------------------------------------------------
+cat <<-'EOF'
+
+======================================================================
+
+                          ++++++++++       ++++++
+                        ++++++++++++++   +++++++
+                       ++++        +++++ ++++
+                      ++++          +++++++++
+                   =+====         =============+
+                 ========       =====+      =====
+                ====  ====     ====           ====
+               ====    ===     ===             ====
+               ====            === ===         ====
+               ====            ===  ==--       ===
+                =====          ===== --       ====
+                 =====================     ======
+                   ============================
+                                     =-----=
+     ____  _                    _  _
+    / ___|| |  ___   _   _   __| || |__    ___  _ __  _ __  _   _
+   | |    | | / _ \ | | | | / _` || '_ \  / _ \| '__|| '__|| | | |
+   | |___ | || (_) || |_| || (_| || |_) ||  __/| |   | |   | |_| |
+    \____||_| \____  \__,_| \__,_||_.__/  \___||_|   |_|    \__, |
+                                                            |___/
+----------------------------------------------------------------------
+
+EOF
+
+# --------------------------------------------------------------------
+# Display System Information
+# --------------------------------------------------------------------
+# The script sources the /etc/os-release file to retrieve the operating
+# system name and version. It then displays the following information:
+# - OS name and version
+# - Current user
+# - Container hostname
+# - IP address
+# - CPU model name and number of cores
+# - Total memory available
+# This information is useful for users to understand the environment they
+# are working in.
+# --------------------------------------------------------------------
+source /etc/os-release
+
+# First, create the CPU info detection function
+get_cpu_info() {
+   # Print a one-line description of the CPU, selected by `uname -m`.
+   local arch vendor impl part
+   arch=$(uname -m)
+   if [ "$arch" = "x86_64" ]; then
+       # Anchored so lscpu's "BIOS Model name:" row (if present) is skipped.
+       lscpu | sed -n 's/^[[:space:]]*Model name:[[:space:]]*//p' | head -n 1
+   elif [ "$arch" = "aarch64" ]; then
+       vendor=$(lscpu | grep 'Vendor ID:' | awk '{print $3}')
+       if [ -f /proc/cpuinfo ]; then
+           # Lines look like "CPU part : 0xd0c"; the value is the last field.
+           impl=$(awk '/CPU implementer/ {print $NF; exit}' /proc/cpuinfo)
+           part=$(awk '/CPU part/ {print $NF; exit}' /proc/cpuinfo)
+       fi
+       if [ "$vendor" = "Apple" ] || [ "$vendor" = "0x61" ]; then
+           echo "Apple Silicon ($arch)"
+       elif [ -n "$impl" ] && [ -n "$part" ]; then
+           echo "ARM $arch (Implementer: $impl, Part: $part)"
+       else
+           echo "ARM $arch"
+       fi
+   else
+       echo "Unknown architecture: $arch"
+   fi
+}
+
+cat <<-EOF
+Welcome to the Apache Cloudberry Build Environment!
+
+Container OS ........ : $NAME $VERSION
+User ................ : $(whoami)
+Container hostname .. : $(hostname)
+IP Address .......... : $(hostname -I | awk '{print $1}')
+CPU Info ............ : $(get_cpu_info)
+CPU(s) .............. : $(nproc)
+Memory .............. : $(free -h | grep Mem: | awk '{print $2}') total
+======================================================================
+
+EOF
+
+# --------------------------------------------------------------------
+# Start an interactive bash shell
+# --------------------------------------------------------------------
+# Finally, the script starts an interactive bash shell to keep the
+# container running and allow the user to interact with the environment.
+# --------------------------------------------------------------------
+/bin/bash
diff --git a/devops/deploy/docker/build/rocky10/tests/requirements.txt b/devops/deploy/docker/build/rocky10/tests/requirements.txt
new file mode 100644
index 00000000000..b9711eddac5
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/tests/requirements.txt
@@ -0,0 +1,3 @@
+testinfra
+pytest-testinfra
+paramiko
diff --git a/devops/deploy/docker/build/rocky10/tests/testinfra/test_cloudberry_db_env.py b/devops/deploy/docker/build/rocky10/tests/testinfra/test_cloudberry_db_env.py
new file mode 100644
index 00000000000..445318f5335
--- /dev/null
+++ b/devops/deploy/docker/build/rocky10/tests/testinfra/test_cloudberry_db_env.py
@@ -0,0 +1,127 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+
+import testinfra
+
+def test_installed_packages(host):
+    """
+    Test if the essential packages are installed.
+    """
+    packages = [
+        "epel-release",
+        "git",
+        "bat",
+        "htop",
+        "bison",
+        "cmake",
+        "gcc",
+        "gcc-c++",
+        "glibc-langpack-en",
+        "glibc-locale-source",
+        "openssh-clients",
+        "openssh-server",
+        "sudo",
+        "rsync",
+        "wget",
+        "openssl-devel",
+        "python3-devel",
+        "readline-devel",
+        "zlib-ng-compat-devel",
+        "libcurl-devel",
+        "libevent-devel",
+        "libxml2-devel",
+        "libuuid-devel",
+        "libzstd-devel",
+        "lz4",
+        "openldap-devel",
+        "libuv-devel",
+        "libyaml-devel"
+    ]
+    for package in packages:
+        pkg = host.package(package)
+        assert pkg.is_installed
+
+
+def test_user_gpadmin_exists(host):
+    """
+    Test if the gpadmin user exists and is configured properly.
+    """
+    user = host.user("gpadmin")
+    assert user.exists
+    assert "wheel" in user.groups
+
+
+def test_ssh_service(host):
+    """
+    Test if SSH service is configured correctly.
+    """
+    sshd_config = host.file("/etc/ssh/sshd_config")
+    assert sshd_config.exists
+
+
+def test_locale_configured(host):
+    """
+    Test if the locale is configured correctly.
+    """
+    locale_conf = host.file("/etc/locale.conf")
+    assert locale_conf.exists
+    assert locale_conf.contains("LANG=en_US.UTF-8")
+
+
+def test_timezone(host):
+    """
+    Test if the timezone is configured correctly.
+    """
+    localtime = host.file("/etc/localtime")
+    assert localtime.exists
+
+
+def test_system_limits_configured(host):
+    """
+    Test if the custom system limits are applied.
+    """
+    limits_file = host.file("/etc/security/limits.d/90-cbdb-limits")
+    assert limits_file.exists
+
+
+def test_init_system_script(host):
+    """
+    Test if the init_system.sh script is present and executable.
+    """
+    script = host.file("/tmp/init_system.sh")
+    assert script.exists
+    assert script.mode == 0o777
+
+
+def test_custom_configuration_files(host):
+    """
+    Test if custom configuration files are correctly copied.
+    """
+    config_file = host.file("/tmp/90-cbdb-limits")
+    assert config_file.exists
+
+
+def test_locale_generated(host):
+    """
+    Test if the en_US.UTF-8 locale is correctly generated.
+    """
+    locale = host.run("locale -a | grep en_US.utf8")
+    assert locale.exit_status == 0
+    assert "en_US.utf8" in locale.stdout
diff --git a/devops/deploy/docker/build/rocky8/Dockerfile b/devops/deploy/docker/build/rocky8/Dockerfile
index 45d6706e593..eed55e4b171 100644
--- a/devops/deploy/docker/build/rocky8/Dockerfile
+++ b/devops/deploy/docker/build/rocky8/Dockerfile
@@ -99,6 +99,7 @@ RUN dnf makecache && \
         krb5-devel \
         libcurl-devel \
         libevent-devel \
+        libicu-devel \
         libssh2-devel \
         libuuid-devel \
         libxml2-devel \
@@ -150,14 +151,14 @@ RUN dnf makecache && \
     make -j$(nproc) && \
     make install -C ~/xerces-c-${XERCES_LATEST_RELEASE} && \
     rm -rf ~/xerces-c* && \
-    cd && GO_VERSION="go1.23.4" && \
+    cd && GO_VERSION="go1.25.10" && \
     ARCH=$(uname -m) && \
     if [ "${ARCH}" = "aarch64" ]; then \
         GO_ARCH="arm64" && \
-        GO_SHA256="16e5017863a7f6071363782b1b8042eb12c6ca4f4cd71528b2123f0a1275b13e"; \
+        GO_SHA256="654da1f9b50a5d1c2a85ccf8ed405aa89c06e94d18384628bf186f7712677b08"; \
     elif [ "${ARCH}" = "x86_64" ]; then \
         GO_ARCH="amd64" && \
-        GO_SHA256="6924efde5de86fe277676e929dc9917d466efa02fb934197bc2eba35d5680971"; \
+        GO_SHA256="42d4f7a32316aa66591eca7e89867256057a4264451aca10570a715b3637ba70"; \
     else \
         echo "Unsupported architecture: ${ARCH}" && exit 1; \
     fi && \
diff --git a/devops/deploy/docker/build/rocky9/Dockerfile b/devops/deploy/docker/build/rocky9/Dockerfile
index 26190109ef0..592d9b2e10a 100644
--- a/devops/deploy/docker/build/rocky9/Dockerfile
+++ b/devops/deploy/docker/build/rocky9/Dockerfile
@@ -120,6 +120,7 @@ RUN dnf makecache && \
         libcurl-devel \
         libssh2-devel \
         libevent-devel \
+        libicu-devel \
         libxml2-devel \
         libuuid-devel \
         libzstd-devel \
@@ -151,14 +152,14 @@ RUN dnf makecache && \
     make -j$(nproc) && \
     make install -C ~/xerces-c-${XERCES_LATEST_RELEASE} && \
     rm -rf ~/xerces-c* && \
-    cd && GO_VERSION="go1.23.4" && \
+    cd && GO_VERSION="go1.25.10" && \
     ARCH=$(uname -m) && \
     if [ "${ARCH}" = "aarch64" ]; then \
         GO_ARCH="arm64" && \
-        GO_SHA256="16e5017863a7f6071363782b1b8042eb12c6ca4f4cd71528b2123f0a1275b13e"; \
+        GO_SHA256="654da1f9b50a5d1c2a85ccf8ed405aa89c06e94d18384628bf186f7712677b08"; \
     elif [ "${ARCH}" = "x86_64" ]; then \
         GO_ARCH="amd64" && \
-        GO_SHA256="6924efde5de86fe277676e929dc9917d466efa02fb934197bc2eba35d5680971"; \
+        GO_SHA256="42d4f7a32316aa66591eca7e89867256057a4264451aca10570a715b3637ba70"; \
     else \
         echo "Unsupported architecture: ${ARCH}" && exit 1; \
     fi && \
diff --git a/devops/deploy/docker/build/ubuntu22.04/Dockerfile b/devops/deploy/docker/build/ubuntu22.04/Dockerfile
index 3023a9fce67..d32467338bd 100644
--- a/devops/deploy/docker/build/ubuntu22.04/Dockerfile
+++ b/devops/deploy/docker/build/ubuntu22.04/Dockerfile
@@ -144,14 +144,14 @@ RUN apt-get update && \
             quilt \
             unzip && \
     apt-get clean && rm -rf /var/lib/apt/lists/* && \
-    cd && GO_VERSION="go1.23.4" && \
+    cd && GO_VERSION="go1.25.10" && \
     ARCH=$(uname -m) && \
     if [ "${ARCH}" = "aarch64" ]; then \
         GO_ARCH="arm64" && \
-        GO_SHA256="16e5017863a7f6071363782b1b8042eb12c6ca4f4cd71528b2123f0a1275b13e"; \
+        GO_SHA256="654da1f9b50a5d1c2a85ccf8ed405aa89c06e94d18384628bf186f7712677b08"; \
     elif [ "${ARCH}" = "x86_64" ]; then \
         GO_ARCH="amd64" && \
-        GO_SHA256="6924efde5de86fe277676e929dc9917d466efa02fb934197bc2eba35d5680971"; \
+        GO_SHA256="42d4f7a32316aa66591eca7e89867256057a4264451aca10570a715b3637ba70"; \
     else \
         echo "Unsupported architecture: ${ARCH}" && exit 1; \
     fi && \
diff --git a/devops/deploy/docker/build/ubuntu24.04/Dockerfile b/devops/deploy/docker/build/ubuntu24.04/Dockerfile
index c4f4e646720..83855bcaf68 100644
--- a/devops/deploy/docker/build/ubuntu24.04/Dockerfile
+++ b/devops/deploy/docker/build/ubuntu24.04/Dockerfile
@@ -144,14 +144,14 @@ RUN apt-get update && \
             quilt \
             unzip && \
     apt-get clean && rm -rf /var/lib/apt/lists/* && \
-    cd && GO_VERSION="go1.23.4" && \
+    cd && GO_VERSION="go1.25.10" && \
     ARCH=$(uname -m) && \
     if [ "${ARCH}" = "aarch64" ]; then \
         GO_ARCH="arm64" && \
-        GO_SHA256="16e5017863a7f6071363782b1b8042eb12c6ca4f4cd71528b2123f0a1275b13e"; \
+        GO_SHA256="654da1f9b50a5d1c2a85ccf8ed405aa89c06e94d18384628bf186f7712677b08"; \
     elif [ "${ARCH}" = "x86_64" ]; then \
         GO_ARCH="amd64" && \
-        GO_SHA256="6924efde5de86fe277676e929dc9917d466efa02fb934197bc2eba35d5680971"; \
+        GO_SHA256="42d4f7a32316aa66591eca7e89867256057a4264451aca10570a715b3637ba70"; \
     else \
         echo "Unsupported architecture: ${ARCH}" && exit 1; \
     fi && \
diff --git a/devops/deploy/docker/test/rocky10/Dockerfile b/devops/deploy/docker/test/rocky10/Dockerfile
new file mode 100644
index 00000000000..ec6b268f708
--- /dev/null
+++ b/devops/deploy/docker/test/rocky10/Dockerfile
@@ -0,0 +1,135 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+#
+# Apache Cloudberry (Incubating) is an effort undergoing incubation at
+# the Apache Software Foundation (ASF), sponsored by the Apache
+# Incubator PMC.
+#
+# Incubation is required of all newly accepted projects until a
+# further review indicates that the infrastructure, communications,
+# and decision making process have stabilized in a manner consistent
+# with other successful ASF projects.
+#
+# While incubation status is not necessarily a reflection of the
+# completeness or stability of the code, it does indicate that the
+# project has yet to be fully endorsed by the ASF.
+#
+# --------------------------------------------------------------------
+# Dockerfile for Apache Cloudberry Base Environment
+# --------------------------------------------------------------------
+# This Dockerfile sets up a Rocky Linux 10-based container to serve as
+# a base environment for evaluating Apache Cloudberry. It installs
+# necessary system utilities, configures the environment for SSH access,
+# and sets up a 'gpadmin' user with sudo privileges. The Cloudberry
+# Database RPM can be installed into this container for testing and
+# functional verification.
+#
+# Key Features:
+# - Locale setup for en_US.UTF-8
+# - SSH daemon setup for remote access
+# - Essential system utilities installation
+# - Separate user creation and configuration steps
+#
+# Security Considerations:
+# - This Dockerfile prioritizes ease of use for functional testing and
+#   evaluation. It includes configurations such as passwordless sudo access
+#   for the 'gpadmin' user and SSH access with password authentication.
+# - These configurations are suitable for testing and development but
+#   should NOT be used in a production environment due to potential security
+#   risks.
+#
+# Usage:
+#   docker build -t cloudberry-db-base-env .
+#   docker run -h cdw -it cloudberry-db-base-env
+# --------------------------------------------------------------------
+
+# Base image: Rocky Linux 10
+FROM rockylinux/rockylinux:10
+
+# Argument for configuring the timezone
+ARG TIMEZONE_VAR="America/Los_Angeles"
+
+# Environment variables for locale
+ENV LANG=en_US.UTF-8
+
+# --------------------------------------------------------------------
+# System Update and Installation
+# --------------------------------------------------------------------
+# Update the system and install essential system utilities required for
+# running and testing Apache Cloudberry. Cleanup the DNF cache afterward
+# to reduce the image size.
+# --------------------------------------------------------------------
+RUN dnf install -y \
+        file \
+        gdb \
+        glibc-locale-source \
+        make \
+        openssh \
+        openssh-clients \
+        openssh-server \
+        procps-ng \
+        sudo \
+        which \
+        && \
+    dnf clean all  # Clean up DNF cache after package installations
+
+# --------------------------------------------------------------------
+# User Creation and Configuration
+# --------------------------------------------------------------------
+# - Create the 'gpadmin' user and group.
+# - Configure the 'gpadmin' user with passwordless sudo privileges.
+# - Add Cloudberry-specific entries to gpadmin's .bashrc.
+# --------------------------------------------------------------------
+RUN /usr/sbin/groupadd gpadmin && \
+    /usr/sbin/useradd gpadmin -g gpadmin -G wheel && \
+    echo 'gpadmin ALL=(ALL) NOPASSWD: ALL' > /etc/sudoers.d/90-gpadmin && \
+    echo -e '\n# Add Cloudberry entries\nif [ -f /usr/local/cloudberry/cloudberry-env.sh ]; then\n  source /usr/local/cloudberry/cloudberry-env.sh\n  export COORDINATOR_DATA_DIRECTORY=/data1/coordinator/gpseg-1\nfi' >> /home/gpadmin/.bashrc
+
+# --------------------------------------------------------------------
+# Copy Configuration Files and Setup the Environment
+# --------------------------------------------------------------------
+# - Copy custom configuration files from the build context to /tmp/.
+# - Apply custom system limits and timezone.
+# - Set up SSH for password-based authentication.
+# - Generate locale and set the default locale to en_US.UTF-8.
+# --------------------------------------------------------------------
+COPY ./configs/* /tmp/
+
+RUN cp /tmp/90-cbdb-limits /etc/security/limits.d/90-cbdb-limits && \
+    sed -i.bak -r 's/^(session\s+required\s+pam_limits.so)/#\1/' /etc/pam.d/* && \
+    cat /usr/share/zoneinfo/${TIMEZONE_VAR} > /etc/localtime && \
+    chmod 777 /tmp/init_system.sh && \
+    setcap cap_net_raw+ep /usr/bin/ping && \
+    ssh-keygen -A && \
+    echo "PasswordAuthentication yes" >> /etc/ssh/sshd_config && \
+    localedef -i en_US -f UTF-8 en_US.UTF-8 && \
+    echo "LANG=en_US.UTF-8" | tee /etc/locale.conf
+
+# --------------------------------------------------------------------
+# Set the Default User and Command
+# --------------------------------------------------------------------
+# The default user is set to 'gpadmin', and the container starts by
+# running the init_system.sh script. This container serves as a base
+# environment, and the Apache Cloudberry RPM can be installed for
+# testing and functional verification.
+# --------------------------------------------------------------------
+USER gpadmin
+
+CMD ["bash","-c","/tmp/init_system.sh"]
diff --git a/devops/deploy/docker/test/rocky10/configs/90-cbdb-limits b/devops/deploy/docker/test/rocky10/configs/90-cbdb-limits
new file mode 100644
index 00000000000..474957c42f6
--- /dev/null
+++ b/devops/deploy/docker/test/rocky10/configs/90-cbdb-limits
@@ -0,0 +1,32 @@
+# /etc/security/limits.d/90-cbdb-limits
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+
+# Core dump file size limits for gpadmin
+gpadmin soft core unlimited
+gpadmin hard core unlimited
+
+# Open file limits for gpadmin
+gpadmin soft nofile 524288
+gpadmin hard nofile 524288
+
+# Process limits for gpadmin
+gpadmin soft nproc 131072
+gpadmin hard nproc 131072
diff --git a/devops/deploy/docker/test/rocky10/configs/gpinitsystem.conf b/devops/deploy/docker/test/rocky10/configs/gpinitsystem.conf
new file mode 100644
index 00000000000..3dcd5a99365
--- /dev/null
+++ b/devops/deploy/docker/test/rocky10/configs/gpinitsystem.conf
@@ -0,0 +1,87 @@
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# ----------------------------------------------------------------------
+# gpinitsystem Configuration File for Apache Cloudberry
+# ----------------------------------------------------------------------
+# This configuration file is used to initialize an Apache Cloudberry
+# cluster. It defines the settings for the coordinator, primary segments,
+# and mirrors, as well as other important configuration options.
+# ----------------------------------------------------------------------
+
+# Segment prefix - This prefix is used for naming the segment directories.
+# For example, the primary segment directories will be named gpseg0, gpseg1, etc.
+SEG_PREFIX=gpseg
+
+# Coordinator port - The port number where the coordinator will listen.
+# This is the port used by clients to connect to the database.
+COORDINATOR_PORT=5432
+
+# Coordinator hostname - The hostname of the machine where the coordinator
+# will be running. The $(hostname) command will automatically insert the
+# hostname of the current machine.
+COORDINATOR_HOSTNAME=$(hostname)
+
+# Coordinator data directory - The directory where the coordinator's data
+# will be stored. This directory should have enough space to store metadata
+# and system catalogs.
+COORDINATOR_DIRECTORY=/data1/coordinator
+
+# Base port for primary segments - The starting port number for the primary
+# segments. Each primary segment will use a unique port number starting from
+# this base.
+PORT_BASE=6000
+
+# Primary segment data directories - An array specifying the directories where
+# the primary segment data will be stored. Each directory corresponds to a
+# primary segment. In this case, two primary segments will be created in the
+# same directory.
+declare -a DATA_DIRECTORY=(/data1/primary /data1/primary)
+
+# Base port for mirror segments - The starting port number for the mirror
+# segments. Each mirror segment will use a unique port number starting from
+# this base.
+MIRROR_PORT_BASE=7000
+
+# Mirror segment data directories - An array specifying the directories where
+# the mirror segment data will be stored. Each directory corresponds to a
+# mirror segment. In this case, two mirror segments will be created in the
+# same directory.
+declare -a MIRROR_DATA_DIRECTORY=(/data1/mirror /data1/mirror)
+
+# Trusted shell - The shell program used for remote execution. Cloudberry uses
+# SSH to run commands on other machines in the cluster. 'ssh' is the default.
+TRUSTED_SHELL=ssh
+
+# Database encoding - The character set encoding to be used by the database.
+# 'UNICODE' is a common choice, especially for internationalization.
+ENCODING=UNICODE
+
+# Default database name - The name of the default database to be created during
+# initialization. This is also the default database that the gpadmin user will
+# connect to.
+DATABASE_NAME=gpadmin
+
+# Machine list file - A file containing the list of hostnames where the primary
+# segments will be created. Each line in the file represents a different machine.
+# This file is critical for setting up the cluster across multiple nodes.
+MACHINE_LIST_FILE=/home/gpadmin/hostfile_gpinitsystem
+
+# ----------------------------------------------------------------------
+# End of gpinitsystem Configuration File
+# ----------------------------------------------------------------------
diff --git a/devops/deploy/docker/test/rocky10/configs/init_system.sh b/devops/deploy/docker/test/rocky10/configs/init_system.sh
new file mode 100755
index 00000000000..3ea7e34b0ff
--- /dev/null
+++ b/devops/deploy/docker/test/rocky10/configs/init_system.sh
@@ -0,0 +1,221 @@
+#!/bin/bash
+# --------------------------------------------------------------------
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed
+# with this work for additional information regarding copyright
+# ownership. The ASF licenses this file to You under the Apache
+# License, Version 2.0 (the "License"); you may not use this file
+# except in compliance with the License. You may obtain a copy of the
+# License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied. See the License for the specific language governing
+# permissions and limitations under the License.
+#
+# --------------------------------------------------------------------
+# Container Initialization Script
+# --------------------------------------------------------------------
+# This script sets up the environment inside the Docker container for
+# the Apache Cloudberry Test Environment. It performs the following
+# tasks:
+#
+# 1. Verifies that the container is running with the expected hostname.
+# 2. Starts the SSH daemon to allow SSH access to the container.
+# 3. Configures passwordless SSH access for the 'gpadmin' user.
+# 4. Sets up the necessary directories and configuration files for
+#    Apache Cloudberry.
+# 5. Displays a welcome banner and system information.
+# 6. Starts an interactive bash shell.
+#
+# This script is intended to be used as an entrypoint or initialization
+# script for the Docker container.
+# --------------------------------------------------------------------
+
+# --------------------------------------------------------------------
+# Check if the hostname is 'cdw'
+# --------------------------------------------------------------------
+# The script checks if the container's hostname is set to 'cdw'. This is
+# a requirement for this environment, and if the hostname does not match,
+# the script will exit with an error message. This ensures consistency
+# across different environments.
+# --------------------------------------------------------------------
+# Abort early unless the container was started with the hostname 'cdw'.
+[[ "$(hostname)" == "cdw" ]] || {
+    printf '%s\n' "Error: This container must be run with the hostname 'cdw'." "Use the following command: docker run -h cdw ..."
+    exit 1
+}
+
+# --------------------------------------------------------------------
+# Start SSH daemon and setup for SSH access
+# --------------------------------------------------------------------
+# The SSH daemon is started to allow remote access to the container via
+# SSH. This is useful for development and debugging purposes. If the SSH
+# daemon fails to start, the script exits with an error.
+# --------------------------------------------------------------------
+sudo /usr/sbin/sshd || {
+    echo "Failed to start SSH daemon" >&2
+    exit 1
+}
+
+# --------------------------------------------------------------------
+# Remove /run/nologin to allow logins
+# --------------------------------------------------------------------
+# The /run/nologin file, if present, prevents users from logging into
+# the system. This file is removed to ensure that users can log in via SSH.
+# --------------------------------------------------------------------
+sudo rm -rf /run/nologin
+
+# --------------------------------------------------------------------
+# Configure passwordless SSH access for 'gpadmin' user
+# --------------------------------------------------------------------
+# The script sets up SSH key-based authentication for the 'gpadmin' user,
+# allowing passwordless SSH access. It generates a new SSH key pair if one
+# does not already exist, and configures the necessary permissions.
+# --------------------------------------------------------------------
+mkdir -p /home/gpadmin/.ssh
+chmod 700 /home/gpadmin/.ssh
+
+if [ ! -f /home/gpadmin/.ssh/id_rsa ]; then
+    ssh-keygen -t rsa -b 4096 -C gpadmin -f /home/gpadmin/.ssh/id_rsa -P "" > /dev/null 2>&1
+fi
+# Authorize the key only if it is not listed yet, so re-running this script does not append duplicates
+grep -qxFf /home/gpadmin/.ssh/id_rsa.pub /home/gpadmin/.ssh/authorized_keys 2>/dev/null || cat /home/gpadmin/.ssh/id_rsa.pub >> /home/gpadmin/.ssh/authorized_keys
+chmod 600 /home/gpadmin/.ssh/authorized_keys
+
+# Add the container's hostname to the known_hosts file to avoid SSH warnings
+ssh-keyscan -t rsa cdw > /home/gpadmin/.ssh/known_hosts 2>/dev/null
+
+# --------------------------------------------------------------------
+# Cloudberry Data Directories Setup
+# --------------------------------------------------------------------
+# The script sets up the necessary directories for Apache Cloudberry,
+# including directories for the coordinator, standby coordinator, primary
+# segments, and mirror segments. It also sets up the configuration files
+# required for initializing the database.
+# --------------------------------------------------------------------
+sudo rm -rf /data1/*
+sudo mkdir -p /data1/coordinator /data1/standby_coordinator /data1/primary /data1/mirror
+sudo chown -R gpadmin:gpadmin /data1
+
+# Copy the gpinitsystem configuration file to the home directory
+cp /tmp/gpinitsystem.conf /home/gpadmin
+
+# Set up the hostfile for cluster initialization (one line: this container's hostname)
+hostname > /home/gpadmin/hostfile_gpinitsystem
+
+# Change to the home directory of the current user (quoted so the path is never word-split)
+cd "$HOME"
+
+# --------------------------------------------------------------------
+# Display a Welcome Banner
+# --------------------------------------------------------------------
+# The following ASCII art and welcome message are displayed when the
+# container starts. This banner provides a visual indication that the
+# container is running in the Apache Cloudberry Test Environment.
+# --------------------------------------------------------------------
+cat <<-'EOF'
+
+======================================================================
+
+                          ++++++++++       ++++++
+                        ++++++++++++++   +++++++
+                       ++++        +++++ ++++
+                      ++++          +++++++++
+                   =+====         =============+
+                 ========       =====+      =====
+                ====  ====     ====           ====
+               ====    ===     ===             ====
+               ====            === ===         ====
+               ====            ===  ==--       ===
+                =====          ===== --       ====
+                 =====================     ======
+                   ============================
+                                     =-----=
+     ____  _                    _  _
+    / ___|| |  ___   _   _   __| || |__    ___  _ __  _ __  _   _
+   | |    | | / _ \ | | | | / _` || '_ \  / _ \| '__|| '__|| | | |
+   | |___ | || (_) || |_| || (_| || |_) ||  __/| |   | |   | |_| |
+    \____||_| \____  \__,_| \__,_||_.__/  \___||_|   |_|    \__, |
+                                                            |___/
+----------------------------------------------------------------------
+
+EOF
+
+# --------------------------------------------------------------------
+# Display System Information
+# --------------------------------------------------------------------
+# The script sources the /etc/os-release file to retrieve the operating
+# system name and version. It then displays the following information:
+# - OS name and version
+# - Current user
+# - Container hostname
+# - IP address
+# - CPU model name and number of cores
+# - Total memory available
+# - Cloudberry version (if installed)
+# This information is useful for users to understand the environment they
+# are working in.
+# --------------------------------------------------------------------
+source /etc/os-release
+
+# First, create the CPU info detection function
+get_cpu_info() {
+   # Print a one-line CPU description; the format depends on the architecture.
+   ARCH=$(uname -m)
+   if [ "$ARCH" = "x86_64" ]; then
+       lscpu | grep 'Model name:' | awk '{print substr($0, index($0,$3))}'
+   elif [ "$ARCH" = "aarch64" ]; then
+       VENDOR=$(lscpu | grep 'Vendor ID:' | awk '{print $3}')
+       if [ "$VENDOR" = "Apple" ] || [ "$VENDOR" = "0x61" ]; then
+           echo "Apple Silicon ($ARCH)"
+       else
+           # /proc/cpuinfo lines look like "CPU implementer : 0x41": the value is
+           # the last field ($3 would be the ':' separator). A missing file just
+           # leaves both variables empty and falls through to the plain output.
+           IMPL=$(grep "CPU implementer" /proc/cpuinfo 2>/dev/null | head -1 | awk '{print $NF}')
+           PART=$(grep "CPU part" /proc/cpuinfo 2>/dev/null | head -1 | awk '{print $NF}')
+           if [ -n "$IMPL" ] && [ -n "$PART" ]; then
+               echo "ARM $ARCH (Implementer: $IMPL, Part: $PART)"
+           else
+               echo "ARM $ARCH"
+           fi
+       fi
+   else
+       echo "Unknown architecture: $ARCH"
+   fi
+}
+
+# Check if Apache Cloudberry is installed and display its version
+# Start from the "Not installed" default; overwrite it only when the RPM is present.
+CBDB_VERSION="Not installed"
+if rpm -q apache-cloudberry-db-incubating &> /dev/null; then
+    CBDB_VERSION=$(/usr/local/cbdb/bin/postgres --gp-version)
+fi
+
+cat <<-EOF
+Welcome to the Apache Cloudberry Test Environment!
+
+Cloudberry version .. : $CBDB_VERSION
+Container OS ........ : $NAME $VERSION
+User ................ : $(whoami)
+Container hostname .. : $(hostname)
+IP Address .......... : $(hostname -I | awk '{print $1}')
+CPU Info ............ : $(get_cpu_info)
+CPU(s) .............. : $(nproc)
+Memory .............. : $(free -h | grep Mem: | awk '{print $2}') total
+======================================================================
+
+EOF
+
+# --------------------------------------------------------------------
+# Start an interactive bash shell
+# --------------------------------------------------------------------
+# Finally, the script starts an interactive bash shell to keep the
+# container running and allow the user to interact with the environment.
+# --------------------------------------------------------------------
+/bin/bash
diff --git a/devops/release/cloudberry-release.sh b/devops/release/cloudberry-release.sh
index 3ab044d5aab..fdc4809f2f8 100755
--- a/devops/release/cloudberry-release.sh
+++ b/devops/release/cloudberry-release.sh
@@ -565,9 +565,10 @@ section "Staging release: $TAG"
   # NOTE: For RC tags like "X.Y.Z-incubating-rcN", keep the tag as-is but
   # generate the tarball name and top-level directory using BASE_VERSION
   # (without "-rcN"). This allows promoting the voted bits without rebuilding.
-  # Keep -rcN in the artifact filename for RC voting, but keep the extracted
-  # top-level directory name as BASE_VERSION (without -rcN).
-  TAR_NAME="apache-cloudberry-${TAG}-src.tar.gz"
+  # Use BASE_VERSION for both tarball filename and extracted directory name
+  # to align with Apache incubator release conventions. This enables direct
+  # 'svn mv' to release repository after voting without renaming artifacts.
+  TAR_NAME="apache-cloudberry-${BASE_VERSION}-src.tar.gz"
   TMP_DIR=$(mktemp -d)
   trap 'rm -rf "$TMP_DIR"' EXIT
 
diff --git a/devops/sandbox/.env b/devops/sandbox/.env
index 233d7c5b1b5..1ceec2e5fb7 100644
--- a/devops/sandbox/.env
+++ b/devops/sandbox/.env
@@ -17,5 +17,5 @@
 # permissions and limitations under the License.
 #
 # --------------------------------------------------------------------
-CODEBASE_VERSION=2.0.0
+CODEBASE_VERSION=2.1.0
 OS_VERSION=rockylinux9
diff --git a/devops/sandbox/Dockerfile.RELEASE.rockylinux9 b/devops/sandbox/Dockerfile.RELEASE.rockylinux9
index ac394c6cb60..215c32f452d 100644
--- a/devops/sandbox/Dockerfile.RELEASE.rockylinux9
+++ b/devops/sandbox/Dockerfile.RELEASE.rockylinux9
@@ -94,6 +94,7 @@ RUN dnf makecache && \
         readline-devel \
         zlib-devel && \
     dnf install -y --enablerepo=crb \
+        liburing-devel \
         libuv-devel \
         libyaml-devel \
         perl-IPC-Run \
@@ -120,10 +121,12 @@ USER gpadmin
 WORKDIR /home/gpadmin
 
 # Release version to build (Apache official tarball)
-ARG CB_RELEASE_VERSION=2.0.0-incubating
+ARG CB_RELEASE_VERSION=2.1.0-incubating
 
 # Download and extract the specified release version from Apache
-RUN wget -nv "https://downloads.apache.org/incubator/cloudberry/${CB_RELEASE_VERSION}/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz" -O /home/gpadmin/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz && \
+# Use the Apache mirror system; -f makes curl fail on HTTP errors instead of saving an error page as the tarball
+RUN curl -fsSL -o /home/gpadmin/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz \
+    "https://www.apache.org/dyn/closer.lua/incubator/cloudberry/${CB_RELEASE_VERSION}/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz?action=download" && \
     tar -xzf /home/gpadmin/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz -C /home/gpadmin && \
     rm -f /home/gpadmin/apache-cloudberry-${CB_RELEASE_VERSION}-src.tar.gz && \
     mv /home/gpadmin/apache-cloudberry-${CB_RELEASE_VERSION} /home/gpadmin/cloudberry
@@ -131,47 +134,9 @@ RUN wget -nv "https://downloads.apache.org/incubator/cloudberry/${CB_RELEASE_VER
 # Build Cloudberry using the official build scripts
 RUN cd /home/gpadmin/cloudberry && \
     export SRC_DIR=/home/gpadmin/cloudberry && \
-    mkdir -p "${SRC_DIR}/build-logs" && \
-    # Ensure Cloudberry lib dir exists and has Xerces libs available
-    sudo rm -rf /usr/local/cloudberry-db && \
-    sudo mkdir -p /usr/local/cloudberry-db/lib && \
-    sudo cp -v /usr/local/xerces-c/lib/libxerces-c.so \
-              /usr/local/xerces-c/lib/libxerces-c-3.*.so \
-              /usr/local/cloudberry-db/lib/ && \
-    sudo chown -R gpadmin:gpadmin /usr/local/cloudberry-db && \
-    # Configure with required features and paths
-    export LD_LIBRARY_PATH=/usr/local/cloudberry-db/lib:$LD_LIBRARY_PATH && \
-    ./configure --prefix=/usr/local/cloudberry-db \
-                --disable-external-fts \
-                --enable-debug \
-                --enable-cassert \
-                --enable-debug-extensions \
-                --enable-gpcloud \
-                --enable-ic-proxy \
-                --enable-mapreduce \
-                --enable-orafce \
-                --enable-orca \
-                --enable-pax \
-                --disable-pxf \
-                --enable-tap-tests \
-                --with-gssapi \
-                --with-ldap \
-                --with-libxml \
-                --with-lz4 \
-                --with-pam \
-                --with-perl \
-                --with-pgport=5432 \
-                --with-python \
-                --with-pythonsrc-ext \
-                --with-ssl=openssl \
-                --with-uuid=e2fs \
-                --with-includes=/usr/local/xerces-c/include \
-                --with-libraries=/usr/local/cloudberry-db/lib && \
-    # Build and install
-    make -j$(nproc) --directory ${SRC_DIR} && \
-    make -j$(nproc) --directory ${SRC_DIR}/contrib && \
-    make install --directory ${SRC_DIR} && \
-    make install --directory "${SRC_DIR}/contrib"
+    mkdir -p ${SRC_DIR}/build-logs && \
+    ./devops/build/automation/cloudberry/scripts/configure-cloudberry.sh && \
+    ./devops/build/automation/cloudberry/scripts/build-cloudberry.sh
 
 # --------------------------------------------------------------------
 # Runtime stage: Rocky Linux 9 runtime with required dependencies
@@ -192,6 +157,7 @@ RUN dnf -y update && \
       krb5-libs \
       libevent \
       libicu \
+      liburing \
       libuuid \
       libxml2 \
       libyaml \
diff --git a/devops/sandbox/README.md b/devops/sandbox/README.md
index 9f475977835..fb6a5ef80c3 100644
--- a/devops/sandbox/README.md
+++ b/devops/sandbox/README.md
@@ -92,14 +92,14 @@ Build and deploy steps:
 
     ```shell
     cd cloudberry/devops/sandbox
-    ./run.sh -c 2.0.0
+    ./run.sh -c 2.1.0
     ```
 
     - For latest Apache Cloudberry release running across multiple containers
 
     ```shell
     cd cloudberry/devops/sandbox
-    ./run.sh -c 2.0.0 -m
+    ./run.sh -c 2.1.0 -m
     ```
 
     - For latest main branch running on a single container
diff --git a/devops/sandbox/run.sh b/devops/sandbox/run.sh
index 7c266b8f64c..705442d98e1 100755
--- a/devops/sandbox/run.sh
+++ b/devops/sandbox/run.sh
@@ -38,7 +38,7 @@ PIP_INDEX_URL_VAR="${PIP_INDEX_URL_VAR:-$DEFAULT_PIP_INDEX_URL_VAR}"
 # Function to display help message
 function usage() {
     echo "Usage: $0 [-o <os_version>] [-c <codebase_version>] [-b] [-m]"
-    echo "  -c  Codebase version (valid values: main, local, or other available version like 2.0.0)"
+    echo "  -c  Codebase version (valid values: main, local, or other available version like 2.1.0)"
     echo "  -t  Timezone (default: America/Los_Angeles, or set via TIMEZONE_VAR environment variable)"
     echo "  -p  Python Package Index (PyPI) (default: https://pypi.org/simple, or set via PIP_INDEX_URL_VAR environment variable)"
     echo "  -b  Build only, do not run the container (default: false, or set via BUILD_ONLY environment variable)"
diff --git a/doc/src/sgml/config.sgml b/doc/src/sgml/config.sgml
index 23f60cad528..9b03793f74a 100644
--- a/doc/src/sgml/config.sgml
+++ b/doc/src/sgml/config.sgml
@@ -9027,6 +9027,23 @@ SET XML OPTION { DOCUMENT | CONTENT };
       </listitem>
      </varlistentry>
 
+     <varlistentry id="guc-restrict-nonsystem-relation-kind" xreflabel="restrict_nonsystem_relation_kind">
+      <term><varname>restrict_nonsystem_relation_kind</varname> (<type>string</type>)
+      <indexterm>
+       <primary><varname>restrict_nonsystem_relation_kind</varname></primary>
+       <secondary>configuration parameter</secondary>
+     </indexterm>
+     </term>
+     <listitem>
+      <para>
+       This variable specifies the relation kinds to which access is restricted.
+       It contains a comma-separated list of relation kinds.  Currently, the
+       supported relation kinds are <literal>view</literal> and
+       <literal>foreign-table</literal>.
+      </para>
+     </listitem>
+     </varlistentry>
+
      </variablelist>
     </sect2>
      <sect2 id="runtime-config-client-format">
diff --git a/doc/src/sgml/protocol.sgml b/doc/src/sgml/protocol.sgml
index 7141f6c277a..682142724c7 100644
--- a/doc/src/sgml/protocol.sgml
+++ b/doc/src/sgml/protocol.sgml
@@ -1527,10 +1527,10 @@ SELCT 1/0;<!-- this typo is intentional -->
 
    <para>
     The frontend should also be prepared to handle an ErrorMessage
-    response to SSLRequest from the server.  This would only occur if
-    the server predates the addition of <acronym>SSL</acronym> support
-    to <productname>PostgreSQL</productname>.  (Such servers are now very ancient,
-    and likely do not exist in the wild anymore.)
+    response to SSLRequest from the server. The frontend should not display
+    this error message to the user/application, since the server has not been
+    authenticated
+    (<ulink url="https://www.postgresql.org/support/security/CVE-2024-10977/">CVE-2024-10977</ulink>).
     In this case the connection must
     be closed, but the frontend might choose to open a fresh connection
     and proceed without requesting <acronym>SSL</acronym>.
@@ -1604,12 +1604,13 @@ SELCT 1/0;<!-- this typo is intentional -->
 
    <para>
     The frontend should also be prepared to handle an ErrorMessage
-    response to GSSENCRequest from the server.  This would only occur if
-    the server predates the addition of <acronym>GSSAPI</acronym> encryption
-    support to <productname>PostgreSQL</productname>.  In this case the
-    connection must be closed, but the frontend might choose to open a fresh
-    connection and proceed without requesting <acronym>GSSAPI</acronym>
-    encryption.
+    response to GSSENCRequest from the server.  The frontend should not display
+    this error message to the user/application, since the server has not been
+    authenticated
+    (<ulink url="https://www.postgresql.org/support/security/CVE-2024-10977/">CVE-2024-10977</ulink>).
+    In this case the connection must be closed, but the frontend might choose
+    to open a fresh connection and proceed without requesting
+    <acronym>GSSAPI</acronym> encryption.
    </para>
 
    <para>
diff --git a/doc/src/sgml/ref/pg_dump.sgml b/doc/src/sgml/ref/pg_dump.sgml
index d3113d76a07..c405fef866b 100644
--- a/doc/src/sgml/ref/pg_dump.sgml
+++ b/doc/src/sgml/ref/pg_dump.sgml
@@ -831,6 +831,14 @@ PostgreSQL documentation
         The only exception is that an empty pattern is disallowed.
        </para>
 
+       <note>
+        <para>
+         Using wildcards in <option>--include-foreign-data</option> may result
+         in access to unexpected foreign servers. Also, to use this option securely,
+         make sure that the named server has a trusted owner.
+        </para>
+       </note>
+
        <note>
         <para>
          When <option>--include-foreign-data</option> is specified,
diff --git a/gpMgmt/bin/Makefile b/gpMgmt/bin/Makefile
index c5eb6ccba9c..7092700b784 100644
--- a/gpMgmt/bin/Makefile
+++ b/gpMgmt/bin/Makefile
@@ -111,8 +111,19 @@ download-python-deps:
 	else \
 		echo "PyGreSQL-$(PYGRESQL_VERSION).tar.gz already exists, skipping download"; \
 	fi
-	# Install wheel and cython for PyYAML building
-	pip3 install --user wheel "cython<3.0.0"
+	# Install wheel and cython for PyYAML building (only if not exists)
+	@if python3 -c "import wheel" >/dev/null 2>&1; then \
+		echo "wheel already exists, skipping installation"; \
+	else \
+		echo "Installing wheel..."; \
+		pip3 install --user wheel 2>/dev/null || pip3 install --user --break-system-packages wheel; \
+	fi
+	@if python3 -c "import cython" >/dev/null 2>&1; then \
+		echo "cython already exists, skipping installation"; \
+	else \
+		echo "Installing cython..."; \
+		pip3 install --user "cython<3.0.0" 2>/dev/null || pip3 install --user --break-system-packages "cython<3.0.0"; \
+	fi
 
 #
 # PyGreSQL
diff --git a/gpMgmt/bin/gpcheckcat_modules/orphaned_toast_tables_check.py b/gpMgmt/bin/gpcheckcat_modules/orphaned_toast_tables_check.py
index 21ec8d18047..789e1b139d2 100644
--- a/gpMgmt/bin/gpcheckcat_modules/orphaned_toast_tables_check.py
+++ b/gpMgmt/bin/gpcheckcat_modules/orphaned_toast_tables_check.py
@@ -25,7 +25,7 @@ def __init__(self):
         # pg_depend back to pg_class, and if the table oids don't match and/or
         # one is missing, the TOAST table is considered to be an orphan.
         # Note: Handles toast tables <pg_toast_temp_*> which is created/used by InitTempTableNamespace().
-        self.orphaned_toast_tables_query = """
+        self.orphaned_toast_tables_query = r"""
 SELECT
     gp_segment_id AS content_id,
     toast_table_oid,
diff --git a/gpMgmt/bin/gppylib/commands/base.py b/gpMgmt/bin/gppylib/commands/base.py
index d455c6e2d13..e09dd40c061 100755
--- a/gpMgmt/bin/gppylib/commands/base.py
+++ b/gpMgmt/bin/gppylib/commands/base.py
@@ -230,7 +230,7 @@ def __init__(self, numWorkers=16, operations=None):
         if operations is not None:
             for operation in operations:
                 self._spoof_operation(operation)
-        super(OperationWorkerPool, self).__init__(numWorkers, operations)
+        super(OperationWorkerPool, self).__init__(numWorkers, items=operations)
 
     def check_results(self):
         raise NotImplementedError("OperationWorkerPool has no means of verifying success.")
diff --git a/gpMgmt/bin/gppylib/commands/pg.py b/gpMgmt/bin/gppylib/commands/pg.py
index a2af133c28f..f430b294500 100644
--- a/gpMgmt/bin/gppylib/commands/pg.py
+++ b/gpMgmt/bin/gppylib/commands/pg.py
@@ -1,13 +1,15 @@
 #!/usr/bin/env python3
 #
-# Copyright (c) Greenplum Inc 2008. All Rights Reserved. 
+# Copyright (c) Greenplum Inc 2008. All Rights Reserved.
 #
 
+from contextlib import closing
 import os
 import pipes
 
 from gppylib.gplog import *
 from gppylib.gparray import *
+from gppylib.db import dbconn
 from .base import *
 from .unix import *
 from gppylib.commands.base import *
@@ -17,6 +19,30 @@
 
 GPHOME=os.environ.get('GPHOME')
 
+
+def ensure_replication_slot_exists(source_host, source_port,
+                                   replication_slot_name):
+    """Create the physical replication slot on the source if it is missing.
+
+    Returns True only when this call created the slot; returns False when
+    no slot name was given or the slot is already present.
+    """
+    if not replication_slot_name:
+        return False
+
+    # Double embedded single quotes so the name is a valid SQL string literal.
+    slot_literal = "'{}'".format(replication_slot_name.replace("'", "''"))
+    source_url = dbconn.DbURL(hostname=source_host, port=source_port,
+                              dbname='template1')
+    with closing(dbconn.connect(source_url, utility=True)) as conn:
+        count_sql = ("SELECT count(*) FROM pg_catalog.pg_replication_slots "
+                     "WHERE slot_name = " + slot_literal)
+        if dbconn.querySingleton(conn, count_sql) > 0:
+            return False
+        dbconn.execSQL(conn, "SELECT pg_catalog.pg_create_physical_replication_slot("
+                             + slot_literal + ")")
+    return True
+
 class DbStatus(Command):
     def __init__(self,name,db,ctxt=LOCAL,remoteHost=None):
         self.db=db        
diff --git a/gpMgmt/bin/gppylib/commands/test/unit/test_unit_pg_base_backup.py b/gpMgmt/bin/gppylib/commands/test/unit/test_unit_pg_base_backup.py
index 117f62b41ea..66621c39d5c 100644
--- a/gpMgmt/bin/gppylib/commands/test/unit/test_unit_pg_base_backup.py
+++ b/gpMgmt/bin/gppylib/commands/test/unit/test_unit_pg_base_backup.py
@@ -1,4 +1,5 @@
 import unittest
+from unittest.mock import Mock, patch
 from gppylib.commands import pg
 
 
@@ -44,6 +45,60 @@ def test_base_backup_does_not_pass_conflicting_xlog_method_argument_when_given_r
         self.assertNotIn("-x", base_backup.command_tokens)
         self.assertNotIn("--xlog", base_backup.command_tokens)
 
+    @patch('gppylib.commands.pg.dbconn.querySingleton', return_value=1)  # count query reports one matching slot
+    @patch('gppylib.commands.pg.dbconn.connect')
+    @patch('gppylib.commands.pg.dbconn.DbURL')
+    def test_ensure_replication_slot_exists_returns_false_when_slot_exists(self, mock_dburl,
+                                                                           mock_connect,
+                                                                           mock_query_singleton):
+        mock_conn = Mock()
+        mock_connect.return_value = mock_conn
+
+        created = pg.ensure_replication_slot_exists('source-host', 5432, 'slot_name')
+
+        self.assertFalse(created)  # an existing slot must not be reported as newly created
+        mock_dburl.assert_called_once_with(hostname='source-host', port=5432, dbname='template1')
+        mock_connect.assert_called_once_with(mock_dburl.return_value, utility=True)
+        self.assertEqual(1, mock_query_singleton.call_count)
+        self.assertIn("FROM pg_catalog.pg_replication_slots", mock_query_singleton.call_args[0][1])  # [0][1] is the SQL text
+        mock_conn.close.assert_called_once_with()  # the connection is closed even on the early return
+
+    @patch('gppylib.commands.pg.dbconn.execSQL')
+    @patch('gppylib.commands.pg.dbconn.querySingleton', return_value=0)  # count query reports no matching slot
+    @patch('gppylib.commands.pg.dbconn.connect')
+    @patch('gppylib.commands.pg.dbconn.DbURL')
+    def test_ensure_replication_slot_exists_creates_missing_slot(self, mock_dburl,
+                                                                 mock_connect,
+                                                                 mock_query_singleton,
+                                                                 mock_exec_sql):
+        mock_conn = Mock()
+        mock_connect.return_value = mock_conn
+
+        created = pg.ensure_replication_slot_exists('source-host', 5432, 'slot_name')
+
+        self.assertTrue(created)  # True signals that this call created the slot
+        mock_dburl.assert_called_once_with(hostname='source-host', port=5432, dbname='template1')
+        mock_connect.assert_called_once_with(mock_dburl.return_value, utility=True)
+        self.assertEqual(1, mock_query_singleton.call_count)
+        self.assertIn("FROM pg_catalog.pg_replication_slots", mock_query_singleton.call_args[0][1])
+        mock_exec_sql.assert_called_once()  # exactly one creation statement is issued
+        self.assertIn("pg_create_physical_replication_slot('slot_name')",
+                      mock_exec_sql.call_args[0][1])  # [0][1] is the SQL text passed to execSQL
+        mock_conn.close.assert_called_once_with()  # the connection is closed after the slot is created
+
+    @patch('gppylib.commands.pg.dbconn.querySingleton')
+    @patch('gppylib.commands.pg.dbconn.connect')
+    @patch('gppylib.commands.pg.dbconn.DbURL')
+    def test_ensure_replication_slot_exists_skips_empty_slot_name(self, mock_dburl,
+                                                                  mock_connect,
+                                                                  mock_query_singleton):
+        created = pg.ensure_replication_slot_exists('source-host', 5432, None)  # no slot name supplied
+
+        self.assertFalse(created)
+        mock_dburl.assert_not_called()  # the function must return before building a connection URL
+        mock_connect.assert_not_called()
+        mock_query_singleton.assert_not_called()
+
 
 if __name__ == '__main__':
     unittest.main()
diff --git a/gpMgmt/bin/gppylib/logfilter.py b/gpMgmt/bin/gppylib/logfilter.py
index c427ac1a6cb..46c0b5e174a 100644
--- a/gpMgmt/bin/gppylib/logfilter.py
+++ b/gpMgmt/bin/gppylib/logfilter.py
@@ -67,7 +67,7 @@ def FilterLogEntries(iterable,
                      filters=[],
                      ibegin=0,
                      jend=None):
-    """
+    r"""
     Generator to consume the lines of a GPDB log file from iterable,
     yield the lines which satisfy the given criteria, and skip the rest.
 
@@ -668,7 +668,7 @@ def MatchInFirstLine(iterable, regex):
 
 
 def NoMatchInFirstLine(iterable, regex):
-    """
+    r"""
     Generator to filter a stream of groups.  Skips those groups whose
     first line contains a match for the given regex; yields all other
     groups.
diff --git a/gpMgmt/bin/gppylib/mainUtils.py b/gpMgmt/bin/gppylib/mainUtils.py
index 553ca9d57c9..e947639591d 100644
--- a/gpMgmt/bin/gppylib/mainUtils.py
+++ b/gpMgmt/bin/gppylib/mainUtils.py
@@ -488,7 +488,7 @@ def parseStatusLine(line, isStart = False, isStop = False):
 
     
 def check_fts(fts):
-    fts_check_cmd= "ps -ef | awk '{print \$2, \$8}' | grep gpfts | grep -v grep"
+    fts_check_cmd= r"ps -ef | awk '{print \$2, \$8}' | grep gpfts | grep -v grep"
     process_cmd = "gpssh -h %s -e \"%s\" | wc -l" % (fts, fts_check_cmd)
     fts_process_res=int(subprocess.check_output(process_cmd, shell=True).decode().strip())
     return fts_process_res == 2
@@ -500,7 +500,7 @@ def check_etcd(etcd):
     if etcd_process_res == 2:
         return True
     # for demo cluster
-    etcd_check_cmd = "ps -ef | awk '{print \$2, \$8}' | grep etcd | grep -v grep"
+    etcd_check_cmd = r"ps -ef | awk '{print \$2, \$8}' | grep etcd | grep -v grep"
     process_cmd = "gpssh -h %s -e \"%s\"| wc -l" % (etcd, etcd_check_cmd)
     etcd_process_res = int(subprocess.check_output(process_cmd, shell=True).decode().strip())
     return etcd_process_res == 2
diff --git a/gpMgmt/bin/gppylib/test/unit/test_unit_gpsegrecovery.py b/gpMgmt/bin/gppylib/test/unit/test_unit_gpsegrecovery.py
index c806dbaed90..b525801b07a 100644
--- a/gpMgmt/bin/gppylib/test/unit/test_unit_gpsegrecovery.py
+++ b/gpMgmt/bin/gppylib/test/unit/test_unit_gpsegrecovery.py
@@ -106,10 +106,12 @@ def setUp(self):
         self.maxDiff = None
         self.mock_logger = Mock(spec=['log', 'info', 'debug', 'error', 'warn', 'exception'])
         self.apply_patches([
+            patch('gpsegrecovery.ensure_replication_slot_exists'),
             patch('gpsegrecovery.start_segment', return_value=Mock()),
             patch('gpsegrecovery.PgBaseBackup.__init__', return_value=None),
             patch('gpsegrecovery.PgBaseBackup.run')
         ])
+        self.mock_ensure_slot = self.get_mock_from_apply_patch('ensure_replication_slot_exists')
         self.mock_pgbasebackup_run = self.get_mock_from_apply_patch('run')
         self.mock_pgbasebackup_init = self.get_mock_from_apply_patch('__init__')
 
@@ -130,6 +132,7 @@ def tearDown(self):
         super(FullRecoveryTestCase, self).tearDown()
 
     def _assert_basebackup_runs(self, expected_init_args):
+        self.mock_ensure_slot.assert_called_once_with('sdw1', 40000, 'internal_wal_replication_slot')
         self.assertEqual(1, self.mock_pgbasebackup_init.call_count)
         self.assertEqual(expected_init_args, self.mock_pgbasebackup_init.call_args)
         self.assertEqual(1, self.mock_pgbasebackup_run.call_count)
@@ -172,49 +175,37 @@ def test_basebackup_run_no_forceoverwrite_passes(self):
         self._assert_basebackup_runs(expected_init_args1)
         self._assert_cmd_passed()
 
-    def test_basebackup_run_one_exception(self):
-        self.mock_pgbasebackup_run.side_effect = [Exception('backup failed once'), Mock()]
+    def test_basebackup_slot_check_exception(self):
+        self.mock_ensure_slot.side_effect = [Exception('slot check failed')]
 
         self.full_recovery_cmd.run()
 
-        expected_init_args1 = call("/data/mirror0", "sdw1", '40000', create_slot=False,
-                                   replication_slot_name='internal_wal_replication_slot',
-                                   forceoverwrite=True, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        expected_init_args2 = call("/data/mirror0", "sdw1", '40000', create_slot=True,
-                                   replication_slot_name='internal_wal_replication_slot',
-                                   forceoverwrite=True, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        self.assertEqual(2, self.mock_pgbasebackup_init.call_count)
-        self.assertEqual([expected_init_args1, expected_init_args2] , self.mock_pgbasebackup_init.call_args_list)
-        self.assertEqual(2, self.mock_pgbasebackup_run.call_count)
-        self.assertEqual([call(validateAfter=True),call(validateAfter=True)], self.mock_pgbasebackup_run.call_args_list)
-        gpsegrecovery.start_segment.assert_called_once_with(self.seg_recovery_info, self.mock_logger, self.era)
-        self._assert_cmd_passed()
+        self.assertEqual(0, self.mock_pgbasebackup_init.call_count)
+        self.assertEqual(0, self.mock_pgbasebackup_run.call_count)
+        self.assertEqual(0, gpsegrecovery.start_segment.call_count)
+        self._assert_cmd_failed('{"error_type": "full", "error_msg": "slot check failed", "dbid": 2, '
+                                '"datadir": "/data/mirror0", "port": 50000, '
+                                '"progress_file": "/tmp/test_progress_file"}')
 
-    def test_basebackup_run_two_exceptions(self):
-        self.mock_pgbasebackup_run.side_effect=[Exception('backup failed once'),
-                                                Exception('backup failed twice')]
+    def test_basebackup_run_exception(self):
+        self.mock_pgbasebackup_run.side_effect = [Exception('backup failed once')]
 
         self.full_recovery_cmd.run()
 
         expected_init_args1 = call("/data/mirror0", "sdw1", '40000', create_slot=False,
                                    replication_slot_name='internal_wal_replication_slot',
                                    forceoverwrite=True, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        expected_init_args2 = call("/data/mirror0", "sdw1", '40000', create_slot=True,
-                                   replication_slot_name='internal_wal_replication_slot',
-                                   forceoverwrite=True, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        self.assertEqual(2, self.mock_pgbasebackup_init.call_count)
-        self.assertEqual([expected_init_args1, expected_init_args2], self.mock_pgbasebackup_init.call_args_list)
-        self.assertEqual(2, self.mock_pgbasebackup_run.call_count)
-        self.assertEqual([call(validateAfter=True),call(validateAfter=True)], self.mock_pgbasebackup_run.call_args_list)
-        self.mock_logger.info.any_call('Running pg_basebackup failed: backup failed once')
-        self.mock_logger.info.assert_called_with("Re-running pg_basebackup, creating the slot this time")
+        self.mock_ensure_slot.assert_called_once_with('sdw1', 40000, 'internal_wal_replication_slot')
+        self.assertEqual(1, self.mock_pgbasebackup_init.call_count)
+        self.assertEqual([expected_init_args1], self.mock_pgbasebackup_init.call_args_list)
+        self.assertEqual(1, self.mock_pgbasebackup_run.call_count)
+        self.assertEqual([call(validateAfter=True)], self.mock_pgbasebackup_run.call_args_list)
         self.assertEqual(0, gpsegrecovery.start_segment.call_count)
-        self._assert_cmd_failed('{"error_type": "full", "error_msg": "backup failed twice", "dbid": 2, ' \
+        self._assert_cmd_failed('{"error_type": "full", "error_msg": "backup failed once", "dbid": 2, '
                                 '"datadir": "/data/mirror0", "port": 50000, "progress_file": "/tmp/test_progress_file"}')
 
-    def test_basebackup_run_no_forceoverwrite_two_exceptions(self):
-        self.mock_pgbasebackup_run.side_effect = [Exception('backup failed once'),
-                                                  Exception('backup failed twice')]
+    def test_basebackup_run_no_forceoverwrite_exception(self):
+        self.mock_pgbasebackup_run.side_effect = [Exception('backup failed once')]
         self.full_recovery_cmd.forceoverwrite = False
 
         self.full_recovery_cmd.run()
@@ -222,16 +213,13 @@ def test_basebackup_run_no_forceoverwrite_two_exceptions(self):
         expected_init_args1 = call("/data/mirror0", "sdw1", '40000', create_slot=False,
                                    replication_slot_name='internal_wal_replication_slot',
                                    forceoverwrite=False, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        # regardless of the passed in value, second call to pg_basebackup will always have forceoverwrite=True
-        expected_init_args2 = call("/data/mirror0", "sdw1", '40000', create_slot=True,
-                                   replication_slot_name='internal_wal_replication_slot',
-                                   forceoverwrite=True, target_gp_dbid=2, progress_file='/tmp/test_progress_file')
-        self.assertEqual(2, self.mock_pgbasebackup_init.call_count)
-        self.assertEqual([expected_init_args1, expected_init_args2], self.mock_pgbasebackup_init.call_args_list)
-        self.assertEqual(2, self.mock_pgbasebackup_run.call_count)
-        self.assertEqual([call(validateAfter=True),call(validateAfter=True)], self.mock_pgbasebackup_run.call_args_list)
+        self.mock_ensure_slot.assert_called_once_with('sdw1', 40000, 'internal_wal_replication_slot')
+        self.assertEqual(1, self.mock_pgbasebackup_init.call_count)
+        self.assertEqual([expected_init_args1], self.mock_pgbasebackup_init.call_args_list)
+        self.assertEqual(1, self.mock_pgbasebackup_run.call_count)
+        self.assertEqual([call(validateAfter=True)], self.mock_pgbasebackup_run.call_args_list)
         self.assertEqual(0, gpsegrecovery.start_segment.call_count)
-        self._assert_cmd_failed('{"error_type": "full", "error_msg": "backup failed twice", "dbid": 2, ' \
+        self._assert_cmd_failed('{"error_type": "full", "error_msg": "backup failed once", "dbid": 2, '
                                 '"datadir": "/data/mirror0", "port": 50000, "progress_file": "/tmp/test_progress_file"}')
 
     def test_basebackup_init_exception(self):
@@ -287,7 +275,10 @@ def tearDown(self):
     @patch('gppylib.commands.pg.PgRewind.run')
     @patch('gpsegrecovery.PgBaseBackup.__init__', return_value=None)
     @patch('gpsegrecovery.PgBaseBackup.run')
-    def test_complete_workflow(self, mock_pgbasebackup_run, mock_pgbasebackup_init, mock_pgrewind_run, mock_pgrewind_init):
+    @patch('gpsegrecovery.ensure_replication_slot_exists')
+    def test_complete_workflow(self, mock_ensure_slot, mock_pgbasebackup_run,
+                               mock_pgbasebackup_init, mock_pgrewind_run,
+                               mock_pgrewind_init):
         mix_confinfo = gppylib.recoveryinfo.serialize_list([
             self.full_r1, self.incr_r2])
         sys.argv = ['gpsegrecovery', '-l', '/tmp/logdir', '--era', '{}'.format(self.era), '-c {}'.format(mix_confinfo)]
@@ -301,17 +292,21 @@ def test_complete_workflow(self, mock_pgbasebackup_run, mock_pgbasebackup_init,
         self.assertEqual(1, mock_pgrewind_init.call_count)
         self.assertEqual(1, mock_pgbasebackup_run.call_count)
         self.assertEqual(1, mock_pgbasebackup_init.call_count)
-        self.assertRegex(gplog.get_logfile(), '/gpsegrecovery.py_\d+\.log')
+        mock_ensure_slot.assert_called_once_with('source_hostname1', 6001, 'internal_wal_replication_slot')
+        self.assertRegex(gplog.get_logfile(), r'/gpsegrecovery.py_\d+\.log')
 
     @patch('gppylib.commands.pg.PgRewind.__init__', return_value=None)
     @patch('gppylib.commands.pg.PgRewind.run')
     @patch('gpsegrecovery.PgBaseBackup.__init__', return_value=None)
     @patch('gpsegrecovery.PgBaseBackup.run')
-    def test_complete_workflow_exception(self, mock_pgbasebackup_run, mock_pgbasebackup_init, mock_pgrewind_run,
+    @patch('gpsegrecovery.ensure_replication_slot_exists')
+    def test_complete_workflow_exception(self, mock_ensure_slot,
+                                         mock_pgbasebackup_run,
+                                         mock_pgbasebackup_init,
+                                         mock_pgrewind_run,
                                          mock_pgrewind_init):
         mock_pgrewind_run.side_effect = [Exception('pg_rewind failed')]
-        mock_pgbasebackup_run.side_effect = [Exception('pg_basebackup failed once'),
-                                             Exception('pg_basebackup failed twice')]
+        mock_pgbasebackup_run.side_effect = [Exception('pg_basebackup failed once')]
         mix_confinfo = gppylib.recoveryinfo.serialize_list([
             self.full_r1, self.incr_r2])
         sys.argv = ['gpsegrecovery', '-l', '/tmp/logdir', '--era={}'.format(self.era), '-c {}'.format(mix_confinfo)]
@@ -322,14 +317,15 @@ def test_complete_workflow_exception(self, mock_pgbasebackup_run, mock_pgbasebac
 
         self.assertCountEqual('[{"error_type": "incremental", "error_msg": "pg_rewind failed", "dbid": 4, "datadir": "target_data_dir4", '
                               '"port": 5004, "progress_file": "/tmp/progress_file4"} , '
-                              '{"error_type": "full", "error_msg": "pg_basebackup failed twice", "dbid": 1,'
+                              '{"error_type": "full", "error_msg": "pg_basebackup failed once", "dbid": 1,'
                               '"datadir": "target_data_dir1", "port": 5001, "progress_file": "/tmp/progress_file1"}]',
                               buf.getvalue().strip())
         self.assertEqual(1, ex.exception.code)
         self.assertEqual(1, mock_pgrewind_run.call_count)
         self.assertEqual(1, mock_pgrewind_init.call_count)
-        self.assertEqual(2, mock_pgbasebackup_run.call_count)
-        self.assertEqual(2, mock_pgbasebackup_init.call_count)
-        self.assertRegex(gplog.get_logfile(), '/gpsegrecovery.py_\d+\.log')
+        self.assertEqual(1, mock_pgbasebackup_run.call_count)
+        self.assertEqual(1, mock_pgbasebackup_init.call_count)
+        mock_ensure_slot.assert_called_once_with('source_hostname1', 6001, 'internal_wal_replication_slot')
+        self.assertRegex(gplog.get_logfile(), r'/gpsegrecovery.py_\d+\.log')
 
     @patch('recovery_base.gplog.setup_tool_logging')
diff --git a/gpMgmt/bin/lib/gpconfigurenewsegment b/gpMgmt/bin/lib/gpconfigurenewsegment
index c37c70bf1fa..4f71348b9a8 100755
--- a/gpMgmt/bin/lib/gpconfigurenewsegment
+++ b/gpMgmt/bin/lib/gpconfigurenewsegment
@@ -10,7 +10,7 @@ from optparse import Option, OptionGroup, OptionParser, OptionValueError, SUPPRE
 
 from gppylib.gpparseopts import OptParser, OptChecker
 from gppylib.commands.gp import ModifyConfSetting, SegmentStart, SegmentStop
-from gppylib.commands.pg import PgBaseBackup
+from gppylib.commands.pg import PgBaseBackup, ensure_replication_slot_exists
 from gppylib.db import dbconn
 from gppylib.commands import unix
 from gppylib.commands.pg import DbStatus
@@ -134,6 +134,10 @@ class ConfExpSegCmd(Command):
                         self.progressFile = '%s/pg_basebackup.%s.dbid%s.out' % (gplog.get_logger_dir(),
                                                                                 datetime.datetime.today().strftime('%Y%m%d_%H%M%S'),
                                                                                 self.dbid)
+                    ensure_replication_slot_exists(
+                        self.syncWithSegmentHostname,
+                        self.syncWithSegmentPort,
+                        self.replicationSlotName)
                     # Create a mirror based on the primary
                     cmd = PgBaseBackup(target_datadir=self.datadir,
                                        source_host=self.syncWithSegmentHostname,
@@ -149,30 +153,9 @@ class ConfExpSegCmd(Command):
                         self.set_results(CommandResult(0, b'', b'', True, False))
                         if shouldDeleteProgressFile:
                             os.remove(self.progressFile)
-
                     except Exception as e:
-                        #  If the cluster never has mirrors, cmd will fail
-                        #  quickly because the internal slot doesn't exist.
-                        #  Re-run with `create_slot`.
-                        #  GPDB_12_MERGE_FIXME could we check it before? or let
-                        #  pg_basebackup create slot if not exists.
-                        cmd = PgBaseBackup(target_datadir=self.datadir,
-                                           source_host=self.syncWithSegmentHostname,
-                                           source_port=str(self.syncWithSegmentPort),
-                                           create_slot = True,
-                                           replication_slot_name=self.replicationSlotName,
-                                           forceoverwrite=True,
-                                           target_gp_dbid=self.dbid,
-                                           logfile=self.progressFile)
-                        try:
-                            logger.info("Re-running pg_basebackup, creating the slot this time")
-                            cmd.run(validateAfter=True)
-                            self.set_results(CommandResult(0, b'', b'', True, False))
-                            if shouldDeleteProgressFile:
-                                os.remove(self.progressFile)
-                        except Exception as e:
-                            self.set_results(CommandResult(1, b'', str(e).encode(), True, False))
-                            raise
+                        self.set_results(CommandResult(1, b'', str(e).encode(), True, False))
+                        raise
 
                     logger.info("Successfully ran pg_basebackup: %s" % cmd.cmdStr)
                     return
diff --git a/gpMgmt/sbin/gpsegrecovery.py b/gpMgmt/sbin/gpsegrecovery.py
index 811a73ccbb5..51c72581e47 100644
--- a/gpMgmt/sbin/gpsegrecovery.py
+++ b/gpMgmt/sbin/gpsegrecovery.py
@@ -4,7 +4,8 @@
 import signal
 
 from gppylib.recoveryinfo import RecoveryErrorType
-from gppylib.commands.pg import PgBaseBackup, PgRewind
+from gppylib.commands.pg import (PgBaseBackup, PgRewind,
+                                 ensure_replication_slot_exists)
 from recovery_base import RecoveryBase, set_recovery_cmd_results
 from gppylib.commands.base import Command
 from gppylib.commands.gp import SegmentStart
@@ -30,6 +31,9 @@ def __init__(self, name, recovery_info, forceoverwrite, logger, era):
     @set_recovery_cmd_results
     def run(self):
         self.error_type = RecoveryErrorType.BASEBACKUP_ERROR
+        ensure_replication_slot_exists(self.recovery_info.source_hostname,
+                                       self.recovery_info.source_port,
+                                       self.replicationSlotName)
         cmd = PgBaseBackup(self.recovery_info.target_datadir,
                            self.recovery_info.source_hostname,
                            str(self.recovery_info.source_port),
@@ -39,26 +43,7 @@ def run(self):
                            target_gp_dbid=self.recovery_info.target_segment_dbid,
                            progress_file=self.recovery_info.progress_file)
         self.logger.info("Running pg_basebackup with progress output temporarily in %s" % self.recovery_info.progress_file)
-        try:
-            cmd.run(validateAfter=True)
-        except Exception as e: #TODO should this be ExecutionError?
-            self.logger.info("Running pg_basebackup failed: {}".format(str(e)))
-
-            #  If the cluster never has mirrors, cmd will fail
-            #  quickly because the internal slot doesn't exist.
-            #  Re-run with `create_slot`.
-            #  GPDB_12_MERGE_FIXME could we check it before? or let
-            #  pg_basebackup create slot if not exists.
-            cmd = PgBaseBackup(self.recovery_info.target_datadir,
-                               self.recovery_info.source_hostname,
-                               str(self.recovery_info.source_port),
-                               create_slot=True,
-                               replication_slot_name=self.replicationSlotName,
-                               forceoverwrite=True,
-                               target_gp_dbid=self.recovery_info.target_segment_dbid,
-                               progress_file=self.recovery_info.progress_file)
-            self.logger.info("Re-running pg_basebackup, creating the slot this time")
-            cmd.run(validateAfter=True)
+        cmd.run(validateAfter=True)
 
         self.error_type = RecoveryErrorType.DEFAULT_ERROR
         self.logger.info("Successfully ran pg_basebackup for dbid: {}".format(
diff --git a/gpcontrib/Makefile b/gpcontrib/Makefile
index 8d95a14f876..2969194cfac 100644
--- a/gpcontrib/Makefile
+++ b/gpcontrib/Makefile
@@ -22,8 +22,7 @@ ifeq "$(enable_debug_extensions)" "yes"
                gp_legacy_string_agg \
                gp_replica_check \
                gp_toolkit \
-               pg_hint_plan \
-               diskquota
+               pg_hint_plan
 else
 	recurse_targets = gp_sparse_vector \
 	       gp_distribution_policy \
@@ -31,10 +30,16 @@ else
                gp_legacy_string_agg \
                gp_exttable_fdw \
                gp_toolkit \
-               pg_hint_plan \
-               diskquota
+               pg_hint_plan
 endif
 
+ifeq "$(with_diskquota)" "yes"
+	recurse_targets += diskquota
+endif
+
+ifeq "$(with_gp_stats_collector)" "yes"
+	recurse_targets += gp_stats_collector
+endif
 ifeq "$(with_zstd)" "yes"
 	recurse_targets += zstd
 endif
@@ -99,4 +104,4 @@ installcheck:
 	$(MAKE) -C gp_sparse_vector installcheck
 	$(MAKE) -C gp_toolkit installcheck
 	$(MAKE) -C gp_exttable_fdw installcheck
-	$(MAKE) -C diskquota installcheck
+	if [ "$(with_diskquota)" = "yes" ]; then $(MAKE) -C diskquota installcheck; fi
diff --git a/gpcontrib/diskquota/CMakeLists.txt b/gpcontrib/diskquota/CMakeLists.txt
index fad393cb101..face48578a6 100644
--- a/gpcontrib/diskquota/CMakeLists.txt
+++ b/gpcontrib/diskquota/CMakeLists.txt
@@ -12,10 +12,6 @@ endif()
 # generate 'compile_commands.json'
 set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
 
-# Retrieve repository information
-include(${CMAKE_CURRENT_SOURCE_DIR}/cmake/Git.cmake)
-GitHash_Get(DISKQUOTA_GIT_HASH)
-
 include(${CMAKE_CURRENT_SOURCE_DIR}/cmake/Gpdb.cmake)
 
 
@@ -154,19 +150,6 @@ add_custom_target(create_artifact
   ${CMAKE_COMMAND} -E tar czvf ${artifact_NAME} "${tgz_NAME}.tar.gz")
 # packing end
 
-# Create build-info
-# The diskquota-build-info shouldn't be copied to GPDB release by install_gpdb_component
-include(${CMAKE_CURRENT_SOURCE_DIR}/cmake/BuildInfo.cmake)
-set(build_info_PATH ${CMAKE_CURRENT_BINARY_DIR}/diskquota-build-info)
-BuildInfo_Create(${build_info_PATH}
-  VARS
-  DISKQUOTA_GIT_HASH
-  DISKQUOTA_VERSION
-  GP_MAJOR_VERSION
-  GP_VERSION
-  CMAKE_BUILD_TYPE)
-# Create build-info end
-
 # Add installcheck targets
 add_subdirectory(tests)
 add_subdirectory(upgrade_test)
@@ -175,4 +158,3 @@ add_subdirectory(upgrade_test)
 install(PROGRAMS "cmake/install_gpdb_component" DESTINATION ".")
 install(FILES ${diskquota_DDL} DESTINATION "share/postgresql/extension/")
 install(TARGETS diskquota DESTINATION "lib/postgresql/")
-install(FILES ${build_info_PATH} DESTINATION ".")
diff --git a/gpcontrib/diskquota/cmake/BuildInfo.cmake b/gpcontrib/diskquota/cmake/BuildInfo.cmake
deleted file mode 100644
index 6e256f34502..00000000000
--- a/gpcontrib/diskquota/cmake/BuildInfo.cmake
+++ /dev/null
@@ -1,32 +0,0 @@
-# Create a build info file based on the given cmake variables
-# For example:
-# BuildInfo_Create(
-# ${CMAKE_CURRENT_BINARY_DIR}/build-info
-# VARS
-# DISKQUOTA_GIT_HASH
-# GP_MAJOR_VERSION)
-# )
-# will create a build info file:
-# ❯ cat build-info
-# DISKQUOTA_GIT_HASH = 151ed92
-# GP_MAJOR_VERSION = 6
-
-function(BuildInfo_Create path)
-  cmake_parse_arguments(
-    arg
-    ""
-    ""
-    "VARS"
-    ${ARGN})
-
-  # Set REGRESS test cases
-  foreach(key IN LISTS arg_VARS)
-    get_property(val VARIABLE PROPERTY ${key})
-    list(APPEND info_list "${key} = ${val}")
-  endforeach()
-  file(WRITE ${path} "")
-  foreach(content IN LISTS info_list)
-    file(APPEND ${path} "${content}\n")
-  endforeach()
-endfunction()
-
diff --git a/gpcontrib/diskquota/cmake/Git.cmake b/gpcontrib/diskquota/cmake/Git.cmake
deleted file mode 100644
index 81a68b1f1f4..00000000000
--- a/gpcontrib/diskquota/cmake/Git.cmake
+++ /dev/null
@@ -1,9 +0,0 @@
-# get git hash
-macro(GitHash_Get _git_hash)
-  find_package(Git)
-  execute_process(
-    COMMAND ${GIT_EXECUTABLE} log -1 --pretty=format:%h
-    OUTPUT_VARIABLE ${_git_hash}
-    OUTPUT_STRIP_TRAILING_WHITESPACE ERROR_QUIET
-    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR})
-endmacro()
diff --git a/gpcontrib/gp_exttable_fdw/input/gp_exttable_fdw.source b/gpcontrib/gp_exttable_fdw/input/gp_exttable_fdw.source
index 41012e73c81..1c089e34760 100644
--- a/gpcontrib/gp_exttable_fdw/input/gp_exttable_fdw.source
+++ b/gpcontrib/gp_exttable_fdw/input/gp_exttable_fdw.source
@@ -53,12 +53,26 @@ OPTIONS (format_type 'c', delimiter ',',
          location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv',
          reject_limit_type 'p', reject_limit '120');
 
--- Error, invalid encoding
+-- Error, invalid encoding (negative numeric ID)
 CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
 SERVER gp_exttable_server
 OPTIONS (format_type 'c', delimiter ',', encoding '-1',
          location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
 
+-- Error, invalid encoding (unknown name)
+CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
+SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',', encoding 'bogus',
+         location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
+
+-- Error, mixed numeric+letters must not be silently truncated to a
+-- valid prefix (atoi('6abc') would return 6 = UTF8; strict parsing
+-- in parse_fdw_encoding_option() rejects it).
+CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
+SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',', encoding '6abc',
+         location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
+
 -- OK, no execute_on | log_errors | encoding | is_writable option
 CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
 SERVER gp_exttable_server
@@ -79,3 +93,59 @@ SELECT urilocation FROM pg_exttable WHERE reloid = 'public.ext_special_uri'::reg
 SELECT ftoptions FROM pg_foreign_table WHERE ftrelid='public.ext_special_uri'::regclass;
 \a
 SELECT * FROM ext_special_uri ORDER BY a;
+
+-- ===================================================================
+-- Tests for issue #1726: FDW OPTIONS encoding accepts both numeric IDs
+-- and symbolic names (UTF8, utf-8, GBK, ...). Names previously parsed
+-- via atoi() and silently degraded to SQL_ASCII.
+-- ===================================================================
+
+-- Numeric form (baseline; worked before the fix as well).
+CREATE FOREIGN TABLE ext_enc_num (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding '6');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_num'::regclass;
+
+-- Symbolic name 'UTF8' — used to be silently SQL_ASCII (the bug).
+CREATE FOREIGN TABLE ext_enc_utf8 (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'UTF8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_utf8'::regclass;
+
+-- Case + dash variant resolved by pg_char_to_encoding().
+CREATE FOREIGN TABLE ext_enc_utf8_dash (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'utf-8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_utf8_dash'::regclass;
+
+-- Non-UTF8 symbolic name.
+CREATE FOREIGN TABLE ext_enc_gbk (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'GBK');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_gbk'::regclass;
+
+-- ALTER FOREIGN TABLE ... OPTIONS (SET encoding 'UTF8') — same code
+-- path, this proves the read-side resolution works after an ALTER too.
+CREATE FOREIGN TABLE ext_enc_alter (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding '0');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_alter'::regclass;
+ALTER FOREIGN TABLE ext_enc_alter OPTIONS (SET encoding 'UTF8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_alter'::regclass;
+
+DROP FOREIGN TABLE ext_enc_num;
+DROP FOREIGN TABLE ext_enc_utf8;
+DROP FOREIGN TABLE ext_enc_utf8_dash;
+DROP FOREIGN TABLE ext_enc_gbk;
+DROP FOREIGN TABLE ext_enc_alter;
diff --git a/gpcontrib/gp_exttable_fdw/option.c b/gpcontrib/gp_exttable_fdw/option.c
index 04cccfe0e47..59bd6b99014 100644
--- a/gpcontrib/gp_exttable_fdw/option.c
+++ b/gpcontrib/gp_exttable_fdw/option.c
@@ -135,11 +135,13 @@ gp_exttable_permission_check(PG_FUNCTION_ARGS)
 		}
 		else if(pg_strcasecmp(def->defname, "encoding") == 0)
 		{
-			char	*encoding = (char *) defGetString(def);
-			if (!PG_VALID_ENCODING(atoi(encoding)))
-				ereport(ERROR,
-				        (errcode(ERRCODE_FDW_INVALID_ATTRIBUTE_VALUE),
-				         errmsg("%s is not a valid encoding code", encoding)));
+			/*
+			 * Accept either a symbolic encoding name (e.g. 'UTF8', 'GBK')
+			 * or a numeric encoding ID. Reject anything else explicitly,
+			 * rather than letting atoi() silently mistranslate non-numeric
+			 * names to SQL_ASCII.
+			 */
+			(void) parse_fdw_encoding_option((char *) defGetString(def));
 		}
 	}
 
diff --git a/gpcontrib/gp_exttable_fdw/output/gp_exttable_fdw.source b/gpcontrib/gp_exttable_fdw/output/gp_exttable_fdw.source
index a3191eb0853..8ba1be8ed6c 100644
--- a/gpcontrib/gp_exttable_fdw/output/gp_exttable_fdw.source
+++ b/gpcontrib/gp_exttable_fdw/output/gp_exttable_fdw.source
@@ -52,12 +52,26 @@ OPTIONS (format_type 'c', delimiter ',',
          location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv',
          reject_limit_type 'p', reject_limit '120');
 ERROR:  segment reject limit in PERCENT must be between 1 and 100 (got 120)  (seg1 127.0.0.1:7003 pid=5173)
--- Error, invalid encoding
+-- Error, invalid encoding (negative numeric ID)
 CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
 SERVER gp_exttable_server
 OPTIONS (format_type 'c', delimiter ',', encoding '-1',
          location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
-ERROR:  -1 is not a valid encoding code  (seg0 127.0.0.1:7002 pid=8289)
+ERROR:  "-1" is not a valid encoding name or code
+-- Error, invalid encoding (unknown name)
+CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
+SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',', encoding 'bogus',
+         location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
+ERROR:  "bogus" is not a valid encoding name or code
+-- Error, mixed numeric+letters must not be silently truncated to a
+-- valid prefix (atoi('6abc') would return 6 = UTF8; strict parsing
+-- in parse_fdw_encoding_option() rejects it).
+CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
+SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',', encoding '6abc',
+         location_uris 'file://@hostname@@abs_srcdir@/data/tableless.csv');
+ERROR:  "6abc" is not a valid encoding name or code
 -- OK, no execute_on | log_errors | encoding | is_writable option
 CREATE FOREIGN TABLE tableless_ext_fdw(a int, b int)
 SERVER gp_exttable_server
@@ -96,3 +110,82 @@ SELECT * FROM ext_special_uri ORDER BY a;
  3 | 3
 (3 rows)
 
+-- ===================================================================
+-- Tests for issue #1726: FDW OPTIONS encoding accepts both numeric IDs
+-- and symbolic names (UTF8, utf-8, GBK, ...). Names previously parsed
+-- via atoi() and silently degraded to SQL_ASCII.
+-- ===================================================================
+-- Numeric form (baseline; worked before the fix as well).
+CREATE FOREIGN TABLE ext_enc_num (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding '6');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_num'::regclass;
+ pg_encoding_to_char 
+---------------------
+ UTF8
+(1 row)
+
+-- Symbolic name 'UTF8' — used to be silently SQL_ASCII (the bug).
+CREATE FOREIGN TABLE ext_enc_utf8 (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'UTF8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_utf8'::regclass;
+ pg_encoding_to_char 
+---------------------
+ UTF8
+(1 row)
+
+-- Case + dash variant resolved by pg_char_to_encoding().
+CREATE FOREIGN TABLE ext_enc_utf8_dash (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'utf-8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_utf8_dash'::regclass;
+ pg_encoding_to_char 
+---------------------
+ UTF8
+(1 row)
+
+-- Non-UTF8 symbolic name.
+CREATE FOREIGN TABLE ext_enc_gbk (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding 'GBK');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_gbk'::regclass;
+ pg_encoding_to_char 
+---------------------
+ GBK
+(1 row)
+
+-- ALTER FOREIGN TABLE ... OPTIONS (SET encoding 'UTF8') — same code
+-- path, this proves the read-side resolution works after an ALTER too.
+CREATE FOREIGN TABLE ext_enc_alter (a int) SERVER gp_exttable_server
+OPTIONS (format_type 'c', delimiter ',',
+         location_uris 'file:///tmp/ext_enc_ignored.csv',
+         encoding '0');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_alter'::regclass;
+ pg_encoding_to_char 
+---------------------
+ SQL_ASCII
+(1 row)
+
+ALTER FOREIGN TABLE ext_enc_alter OPTIONS (SET encoding 'UTF8');
+SELECT pg_encoding_to_char(encoding) FROM pg_exttable
+WHERE  reloid = 'ext_enc_alter'::regclass;
+ pg_encoding_to_char 
+---------------------
+ UTF8
+(1 row)
+
+DROP FOREIGN TABLE ext_enc_num;
+DROP FOREIGN TABLE ext_enc_utf8;
+DROP FOREIGN TABLE ext_enc_utf8_dash;
+DROP FOREIGN TABLE ext_enc_gbk;
+DROP FOREIGN TABLE ext_enc_alter;
diff --git a/gpcontrib/gp_internal_tools/Makefile b/gpcontrib/gp_internal_tools/Makefile
index 643a13f0118..829645e1268 100755
--- a/gpcontrib/gp_internal_tools/Makefile
+++ b/gpcontrib/gp_internal_tools/Makefile
@@ -4,6 +4,8 @@ DATA       = gp_internal_tools--1.0.0.sql
 
 PG_CPPFLAGS = -I$(libpq_srcdir)
 
+REGRESS = gp_session_state_memory
+
 ifdef USE_PGXS
 PG_CONFIG = pg_config
 PGXS := $(shell $(PG_CONFIG) --pgxs)
diff --git a/gpcontrib/gp_stats_collector/.clang-format b/gpcontrib/gp_stats_collector/.clang-format
new file mode 100644
index 00000000000..eb90ff33671
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/.clang-format
@@ -0,0 +1,178 @@
+---
+Language:        Cpp
+AccessModifierOffset: -4
+AlignAfterOpenBracket: Align
+AlignConsecutiveMacros: false
+AlignConsecutiveAssignments: false
+AlignConsecutiveBitFields: false
+AlignConsecutiveDeclarations: false
+AlignEscapedNewlines: Left
+AlignOperands:   Align
+AlignTrailingComments: true
+AllowAllArgumentsOnNextLine: true
+AllowAllConstructorInitializersOnNextLine: true
+AllowAllParametersOfDeclarationOnNextLine: false
+AllowShortEnumsOnASingleLine: true
+AllowShortBlocksOnASingleLine: Never
+AllowShortCaseLabelsOnASingleLine: false
+AllowShortFunctionsOnASingleLine: None
+AllowShortLambdasOnASingleLine: All
+AllowShortIfStatementsOnASingleLine: Never
+AllowShortLoopsOnASingleLine: false
+AlwaysBreakAfterDefinitionReturnType: All
+AlwaysBreakAfterReturnType: AllDefinitions
+AlwaysBreakBeforeMultilineStrings: true
+AlwaysBreakTemplateDeclarations: Yes
+BinPackArguments: true
+BinPackParameters: true
+BraceWrapping:
+  AfterCaseLabel:  true
+  AfterClass:      true
+  AfterControlStatement: Always
+  AfterEnum:       true
+  AfterFunction:   true
+  AfterNamespace:  true
+  AfterObjCDeclaration: true
+  AfterStruct:     true
+  AfterUnion:      true
+  AfterExternBlock: false
+  BeforeCatch:     true
+  BeforeElse:      true
+  BeforeLambdaBody: false
+  BeforeWhile:     false
+  IndentBraces:    false
+  SplitEmptyFunction: true
+  SplitEmptyRecord: true
+  SplitEmptyNamespace: true
+BreakBeforeBinaryOperators: None
+BreakBeforeBraces: Custom
+BreakBeforeInheritanceComma: false
+BreakInheritanceList: BeforeColon
+BreakBeforeTernaryOperators: true
+BreakConstructorInitializersBeforeComma: false
+BreakConstructorInitializers: BeforeColon
+BreakAfterJavaFieldAnnotations: false
+BreakStringLiterals: false
+ColumnLimit:     80
+CommentPragmas:  '^ IWYU pragma:'
+CompactNamespaces: false
+ConstructorInitializerAllOnOneLineOrOnePerLine: true
+ConstructorInitializerIndentWidth: 4
+ContinuationIndentWidth: 4
+Cpp11BracedListStyle: true
+DeriveLineEnding: true
+DerivePointerAlignment: false
+DisableFormat:   false
+ExperimentalAutoDetectBinPacking: false
+FixNamespaceComments: true
+ForEachMacros:
+  - foreach
+  - Q_FOREACH
+  - BOOST_FOREACH
+IncludeBlocks:   Preserve
+IncludeCategories:
+  - Regex: '^<.*'  # angle-bracket includes
+    Priority: 1
+  - Regex: '"protos/.*\.pb\.h"'  # quoted *.pb.h headers under protos/
+    Priority: 2
+  - Regex: '"postgres\.h"'
+    Priority: 3
+  - Regex: '.*'  # catch-all for every remaining include
+    Priority: 4
+IncludeIsMainRegex: '([-_](test|unittest))?$'
+IncludeIsMainSourceRegex: ''
+IndentCaseLabels: true
+IndentCaseBlocks: false
+IndentGotoLabels: true
+IndentPPDirectives: None
+IndentExternBlock: AfterExternBlock
+IndentWidth:     4
+IndentWrappedFunctionNames: false
+InsertTrailingCommas: None
+JavaScriptQuotes: Leave
+JavaScriptWrapImports: true
+KeepEmptyLinesAtTheStartOfBlocks: false
+MacroBlockBegin: ''
+MacroBlockEnd:   ''
+MaxEmptyLinesToKeep: 3
+NamespaceIndentation: None
+ObjCBinPackProtocolList: Never
+ObjCBlockIndentWidth: 2
+ObjCBreakBeforeNestedBlockParam: true
+ObjCSpaceAfterProperty: false
+ObjCSpaceBeforeProtocolList: true
+PenaltyBreakAssignment: 2
+PenaltyBreakBeforeFirstCallParameter: 1
+PenaltyBreakComment: 300
+PenaltyBreakFirstLessLess: 120
+PenaltyBreakString: 1000
+PenaltyBreakTemplateDeclaration: 10
+PenaltyExcessCharacter: 1000000
+PenaltyReturnTypeOnItsOwnLine: 200
+PointerAlignment: Right
+RawStringFormats:
+  - Language:        Cpp
+    Delimiters:
+      - cc
+      - CC
+      - cpp
+      - Cpp
+      - CPP
+      - 'c++'
+      - 'C++'
+    CanonicalDelimiter: ''
+    BasedOnStyle:    google
+  - Language:        TextProto
+    Delimiters:
+      - pb
+      - PB
+      - proto
+      - PROTO
+    EnclosingFunctions:
+      - EqualsProto
+      - EquivToProto
+      - PARSE_PARTIAL_TEXT_PROTO
+      - PARSE_TEST_PROTO
+      - PARSE_TEXT_PROTO
+      - ParseTextOrDie
+      - ParseTextProtoOrDie
+      - ParseTestProto
+      - ParsePartialTestProto
+    CanonicalDelimiter: ''
+    BasedOnStyle:    google
+ReflowComments:  false
+SortIncludes:    true
+SortUsingDeclarations: true
+SpaceAfterCStyleCast: true
+SpaceAfterLogicalNot: false
+SpaceAfterTemplateKeyword: true
+SpaceBeforeAssignmentOperators: true
+SpaceBeforeCpp11BracedList: false
+SpaceBeforeCtorInitializerColon: true
+SpaceBeforeInheritanceColon: true
+SpaceBeforeParens: ControlStatements
+SpaceBeforeRangeBasedForLoopColon: true
+SpaceInEmptyBlock: false
+SpaceInEmptyParentheses: false
+SpacesBeforeTrailingComments: 2
+SpacesInAngles:  false
+SpacesInConditionalStatement: false
+SpacesInContainerLiterals: true
+SpacesInCStyleCastParentheses: false
+SpacesInParentheses: false
+SpacesInSquareBrackets: false
+SpaceBeforeSquareBrackets: false
+Standard:        Auto
+StatementMacros:
+  - Q_UNUSED
+  - QT_REQUIRE_VERSION
+TabWidth:        4
+UseCRLF:         false
+UseTab:          Always
+WhitespaceSensitiveMacros:
+  - STRINGIZE
+  - PP_STRINGIZE
+  - BOOST_PP_STRINGIZE
+...
+
+
diff --git a/gpcontrib/gp_stats_collector/Makefile b/gpcontrib/gp_stats_collector/Makefile
new file mode 100644
index 00000000000..b3228d2c45e
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/Makefile
@@ -0,0 +1,48 @@
+# Build rules for the gp_stats_collector extension: hand-written C/C++
+# sources plus C++ code generated from protos/*.proto by protoc.
+
+MODULE_big = gp_stats_collector
+EXTENSION  = gp_stats_collector
+DATA       = $(wildcard *--*.sql)
+REGRESS    = gpsc_cursors gpsc_dist gpsc_select gpsc_utf8_trim gpsc_utility gpsc_guc_cache gpsc_uds gpsc_locale
+
+# Each protobuf base name contributes src/protos/<base>.pb.o to the module.
+PROTO_BASES = gpsc_plan gpsc_metrics gpsc_set_service
+PROTO_OBJS  = $(patsubst %,src/protos/%.pb.o,$(PROTO_BASES))
+
+# Hand-written objects. The C++ wildcard does not cover src/protos; the
+# generated objects are listed through PROTO_OBJS instead.
+C_OBJS   = $(patsubst %.c,%.o,$(wildcard src/*.c src/*/*.c))
+CPP_OBJS = $(patsubst %.cpp,%.o,$(wildcard src/*.cpp src/log/*.cpp src/memory/*.cpp))
+OBJS     = $(C_OBJS) $(CPP_OBJS) $(PROTO_OBJS)
+
+PG_CXXFLAGS += -Werror -Wall -Wno-unused-but-set-variable -std=c++17 -Isrc/protos -Isrc -Iinclude -DGPBUILD
+SHLIB_LINK += -lprotobuf -lstdc++
+# The whole generated-code directory is removed by "make clean".
+EXTRA_CLEAN = src/protos
+
+ifdef USE_PGXS
+PG_CONFIG = pg_config
+PGXS := $(shell $(PG_CONFIG) --pgxs)
+include $(PGXS)
+else
+subdir = gpcontrib/gp_stats_collector
+top_builddir = ../..
+include $(top_builddir)/src/Makefile.global
+include $(top_srcdir)/contrib/contrib-global.mk
+endif
+
+# Generate every protobuf source in a single protoc run; .done is the stamp
+# file recording that generation finished. protoc writes *.pb.cc, which the
+# loop renames to *.pb.cpp. "set -e" aborts the recipe on the first failed
+# rename so the stamp is never touched after a partial generation.
+src/protos/.done: $(wildcard protos/*.proto)
+	@mkdir -p src/protos
+	protoc -I /usr/include -I /usr/local/include -I . --cpp_out=src $^
+	set -e; for f in src/protos/*.pb.cc; do mv "$$f" "$${f%.cc}.cpp"; done
+	touch $@
+
+# The generated sources and headers are produced as by-products of the stamp.
+src/protos/%.pb.cpp src/protos/%.pb.h: src/protos/.done ;
+# Compile hand-written C++ objects only after code generation has run.
+$(CPP_OBJS): src/protos/.done
diff --git a/gpcontrib/gp_stats_collector/README.md b/gpcontrib/gp_stats_collector/README.md
new file mode 100644
index 00000000000..8c2d5c6868e
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/README.md
@@ -0,0 +1,47 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one
+  or more contributor license agreements.  See the NOTICE file
+  distributed with this work for additional information
+  regarding copyright ownership.  The ASF licenses this file
+  to you under the Apache License, Version 2.0 (the
+  "License"); you may not use this file except in compliance
+  with the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing,
+  software distributed under the License is distributed on an
+  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  KIND, either express or implied.  See the License for the
+  specific language governing permissions and limitations
+  under the License.
+-->
+
+## GP Stats Collector
+
+An extension for collecting query execution metrics and reporting them to an external agent.
+
+### Collected Statistics
+
+#### 1. Query Lifecycle
+-   **What:** Captures query text, normalized query text, timestamps (submit, start, end, done), and user/database info.
+-   **GUC:** `gpsc.enable`.
+
+#### 2. `EXPLAIN` data
+-   **What:** Triggers generation of `EXPLAIN (TEXT, COSTS, VERBOSE)` output and captures it.
+-   **GUC:** `gpsc.enable`.
+
+#### 3. `EXPLAIN ANALYZE` data
+-   **What:** Triggers generation of `EXPLAIN (TEXT, ANALYZE, BUFFERS, TIMING, VERBOSE)` output and captures it.
+-   **GUCs:** `gpsc.enable`, `gpsc.min_analyze_time`, `gpsc.enable_cdbstats` (ANALYZE), `gpsc.enable_analyze` (BUFFERS, TIMING, VERBOSE).
+
+#### 4. Other Metrics
+-   **What:** Captures Instrument, System, Network, Interconnect, Spill metrics.
+-   **GUC:** `gpsc.enable`.
+
+### General Configuration
+-   **Nested Queries:** When `gpsc.report_nested_queries` is `false`, only top-level queries are reported from the coordinator and segments. When it is `true`, both top-level and nested queries are reported from the coordinator, while data from segments is collected as aggregates.
+-   **Data Destination:** All collected data is sent to a Unix Domain Socket. Configure the path with `gpsc.uds_path`.
+-   **User Filtering:** To exclude activity from certain roles, add them to the comma-separated list in `gpsc.ignored_users_list`.
+-   **Trimming plans:** Query texts and execution plans are trimmed based on `gpsc.max_text_size` and `gpsc.max_plan_size` (default: 1024KB). For now, it is not recommended to set these GUCs higher than 1024KB.
+-   **Analyze collection:** Analyze data is collected if `gpsc.enable_analyze` is true, and it is sent if the execution time exceeds `gpsc.min_analyze_time` (10 seconds by default).
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_cursors.out b/gpcontrib/gp_stats_collector/expected/gpsc_cursors.out
new file mode 100644
index 00000000000..282d9ac49e1
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_cursors.out
@@ -0,0 +1,163 @@
+CREATE EXTENSION gp_stats_collector;
+CREATE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+-- DECLARE
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+DECLARE cursor_stats_0 CURSOR FOR SELECT 0;
+CLOSE cursor_stats_0;
+COMMIT;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                 query_text                  |    query_status     
+-------+---------------------------------------------+---------------------
+    -1 | BEGIN;                                      | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                                      | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_0 CURSOR FOR SELECT 0; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_0 CURSOR FOR SELECT 0; | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_0;                       | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_0;                       | QUERY_STATUS_DONE
+    -1 | COMMIT;                                     | QUERY_STATUS_SUBMIT
+    -1 | COMMIT;                                     | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                    | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                    | QUERY_STATUS_DONE
+(10 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- DECLARE WITH HOLD
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+DECLARE cursor_stats_1 CURSOR WITH HOLD FOR SELECT 1;
+CLOSE cursor_stats_1;
+DECLARE cursor_stats_2 CURSOR WITH HOLD FOR SELECT 2;
+CLOSE cursor_stats_2;
+COMMIT;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                      query_text                       |    query_status     
+-------+-------------------------------------------------------+---------------------
+    -1 | BEGIN;                                                | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                                                | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_1 CURSOR WITH HOLD FOR SELECT 1; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_1 CURSOR WITH HOLD FOR SELECT 1; | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_1;                                 | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_1;                                 | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_2 CURSOR WITH HOLD FOR SELECT 2; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_2 CURSOR WITH HOLD FOR SELECT 2; | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_2;                                 | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_2;                                 | QUERY_STATUS_DONE
+    -1 | COMMIT;                                               | QUERY_STATUS_SUBMIT
+    -1 | COMMIT;                                               | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                              | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                              | QUERY_STATUS_DONE
+(14 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- ROLLBACK
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+DECLARE cursor_stats_3 CURSOR FOR SELECT 1;
+CLOSE cursor_stats_3;
+DECLARE cursor_stats_4 CURSOR FOR SELECT 1;
+ROLLBACK;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                 query_text                  |    query_status     
+-------+---------------------------------------------+---------------------
+    -1 | BEGIN;                                      | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                                      | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_3 CURSOR FOR SELECT 1; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_3 CURSOR FOR SELECT 1; | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_3;                       | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_3;                       | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_4 CURSOR FOR SELECT 1; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_4 CURSOR FOR SELECT 1; | QUERY_STATUS_DONE
+    -1 | ROLLBACK;                                   | QUERY_STATUS_SUBMIT
+    -1 | ROLLBACK;                                   | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                    | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                    | QUERY_STATUS_DONE
+(12 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- FETCH
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+DECLARE cursor_stats_5 CURSOR WITH HOLD FOR SELECT 2;
+DECLARE cursor_stats_6 CURSOR WITH HOLD FOR SELECT 3;
+FETCH 1 IN cursor_stats_5;
+ ?column? 
+----------
+        2
+(1 row)
+
+FETCH 1 IN cursor_stats_6;
+ ?column? 
+----------
+        3
+(1 row)
+
+CLOSE cursor_stats_5;
+CLOSE cursor_stats_6;
+COMMIT;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                      query_text                       |    query_status     
+-------+-------------------------------------------------------+---------------------
+    -1 | BEGIN;                                                | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                                                | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_5 CURSOR WITH HOLD FOR SELECT 2; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_5 CURSOR WITH HOLD FOR SELECT 2; | QUERY_STATUS_DONE
+    -1 | DECLARE cursor_stats_6 CURSOR WITH HOLD FOR SELECT 3; | QUERY_STATUS_SUBMIT
+    -1 | DECLARE cursor_stats_6 CURSOR WITH HOLD FOR SELECT 3; | QUERY_STATUS_DONE
+    -1 | FETCH 1 IN cursor_stats_5;                            | QUERY_STATUS_SUBMIT
+    -1 | FETCH 1 IN cursor_stats_5;                            | QUERY_STATUS_DONE
+    -1 | FETCH 1 IN cursor_stats_6;                            | QUERY_STATUS_SUBMIT
+    -1 | FETCH 1 IN cursor_stats_6;                            | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_5;                                 | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_5;                                 | QUERY_STATUS_DONE
+    -1 | CLOSE cursor_stats_6;                                 | QUERY_STATUS_SUBMIT
+    -1 | CLOSE cursor_stats_6;                                 | QUERY_STATUS_DONE
+    -1 | COMMIT;                                               | QUERY_STATUS_SUBMIT
+    -1 | COMMIT;                                               | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                              | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                              | QUERY_STATUS_DONE
+(18 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_dist.out b/gpcontrib/gp_stats_collector/expected/gpsc_dist.out
new file mode 100644
index 00000000000..92e8678767b
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_dist.out
@@ -0,0 +1,175 @@
+CREATE EXTENSION gp_stats_collector;
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+SET gpsc.enable_utility TO FALSE;
+-- Hash distributed table
+CREATE TABLE test_hash_dist (id int) DISTRIBUTED BY (id);
+INSERT INTO test_hash_dist SELECT 1;
+SET gpsc.logging_mode to 'TBL';
+SET optimizer_enable_direct_dispatch TO TRUE;
+-- Direct dispatch is used here, only one segment is scanned.
+select * from test_hash_dist where id = 1;
+ id 
+----
+  1
+(1 row)
+
+RESET optimizer_enable_direct_dispatch;
+RESET gpsc.logging_mode;
+-- Should see 8 rows.
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                 query_text                 |    query_status     
+-------+--------------------------------------------+---------------------
+    -1 | select * from test_hash_dist where id = 1; | QUERY_STATUS_SUBMIT
+    -1 | select * from test_hash_dist where id = 1; | QUERY_STATUS_START
+    -1 | select * from test_hash_dist where id = 1; | QUERY_STATUS_END
+    -1 | select * from test_hash_dist where id = 1; | QUERY_STATUS_DONE
+     1 |                                            | QUERY_STATUS_SUBMIT
+     1 |                                            | QUERY_STATUS_START
+     1 |                                            | QUERY_STATUS_END
+     1 |                                            | QUERY_STATUS_DONE
+(8 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+SET gpsc.logging_mode to 'TBL';
+-- Scan all segments.
+select * from test_hash_dist;
+ id 
+----
+  1
+(1 row)
+
+DROP TABLE test_hash_dist;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |          query_text           |    query_status     
+-------+-------------------------------+---------------------
+    -1 | select * from test_hash_dist; | QUERY_STATUS_SUBMIT
+    -1 | select * from test_hash_dist; | QUERY_STATUS_START
+    -1 | select * from test_hash_dist; | QUERY_STATUS_END
+    -1 | select * from test_hash_dist; | QUERY_STATUS_DONE
+     1 |                               | QUERY_STATUS_SUBMIT
+     1 |                               | QUERY_STATUS_START
+     1 |                               | QUERY_STATUS_END
+     1 |                               | QUERY_STATUS_DONE
+     2 |                               | QUERY_STATUS_SUBMIT
+     2 |                               | QUERY_STATUS_START
+     2 |                               | QUERY_STATUS_END
+     2 |                               | QUERY_STATUS_DONE
+       |                               | QUERY_STATUS_SUBMIT
+       |                               | QUERY_STATUS_START
+       |                               | QUERY_STATUS_END
+       |                               | QUERY_STATUS_DONE
+(16 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Replicated table
+CREATE FUNCTION force_segments() RETURNS SETOF text AS $$
+BEGIN
+  RETURN NEXT 'seg';
+END;
+$$ LANGUAGE plpgsql VOLATILE EXECUTE ON ALL SEGMENTS;
+CREATE TABLE test_replicated (id int) DISTRIBUTED REPLICATED;
+INSERT INTO test_replicated SELECT 1;
+SET gpsc.logging_mode to 'TBL';
+SELECT COUNT(*) FROM test_replicated, force_segments();
+ count 
+-------
+     3
+(1 row)
+
+DROP TABLE test_replicated;
+DROP FUNCTION force_segments();
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                       query_text                        |    query_status     
+-------+---------------------------------------------------------+---------------------
+    -1 | SELECT COUNT(*) FROM test_replicated, force_segments(); | QUERY_STATUS_SUBMIT
+    -1 | SELECT COUNT(*) FROM test_replicated, force_segments(); | QUERY_STATUS_START
+    -1 | SELECT COUNT(*) FROM test_replicated, force_segments(); | QUERY_STATUS_END
+    -1 | SELECT COUNT(*) FROM test_replicated, force_segments(); | QUERY_STATUS_DONE
+     1 |                                                         | QUERY_STATUS_SUBMIT
+     1 |                                                         | QUERY_STATUS_START
+     1 |                                                         | QUERY_STATUS_END
+     1 |                                                         | QUERY_STATUS_DONE
+     2 |                                                         | QUERY_STATUS_SUBMIT
+     2 |                                                         | QUERY_STATUS_START
+     2 |                                                         | QUERY_STATUS_END
+     2 |                                                         | QUERY_STATUS_DONE
+       |                                                         | QUERY_STATUS_SUBMIT
+       |                                                         | QUERY_STATUS_START
+       |                                                         | QUERY_STATUS_END
+       |                                                         | QUERY_STATUS_DONE
+(16 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Partially distributed table (2 numsegments)
+SET allow_system_table_mods = ON;
+CREATE TABLE test_partial_dist (id int, data text) DISTRIBUTED BY (id);
+UPDATE gp_distribution_policy SET numsegments = 2 WHERE localoid = 'test_partial_dist'::regclass;
+INSERT INTO test_partial_dist SELECT * FROM generate_series(1, 100);
+SET gpsc.logging_mode to 'TBL';
+SELECT COUNT(*) FROM test_partial_dist;
+ count 
+-------
+   100
+(1 row)
+
+RESET gpsc.logging_mode;
+DROP TABLE test_partial_dist;
+RESET allow_system_table_mods;
+-- Should see 12 rows.
+SELECT query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+               query_text                |    query_status     
+-----------------------------------------+---------------------
+ SELECT COUNT(*) FROM test_partial_dist; | QUERY_STATUS_SUBMIT
+ SELECT COUNT(*) FROM test_partial_dist; | QUERY_STATUS_START
+ SELECT COUNT(*) FROM test_partial_dist; | QUERY_STATUS_END
+ SELECT COUNT(*) FROM test_partial_dist; | QUERY_STATUS_DONE
+                                         | QUERY_STATUS_SUBMIT
+                                         | QUERY_STATUS_START
+                                         | QUERY_STATUS_END
+                                         | QUERY_STATUS_DONE
+                                         | QUERY_STATUS_SUBMIT
+                                         | QUERY_STATUS_START
+                                         | QUERY_STATUS_END
+                                         | QUERY_STATUS_DONE
+(12 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_guc_cache.out b/gpcontrib/gp_stats_collector/expected/gpsc_guc_cache.out
new file mode 100644
index 00000000000..11a420839db
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_guc_cache.out
@@ -0,0 +1,57 @@
+--
+-- Test GUC caching for query lifecycle consistency.
+--
+-- The extension logs SUBMIT and DONE events for each query.
+-- GUC values that control logging (enable_utility, ignored_users_list, ...)
+-- must be cached at SUBMIT time to ensure DONE uses the same filtering
+-- criteria. Otherwise, a SET command that modifies these GUCs would
+-- have its DONE event rejected, creating orphaned SUBMIT entries.
+-- This is due to query being actually executed between SUBMIT and DONE.
+-- start_ignore
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+SELECT gpsc.truncate_log();
+-- end_ignore
+CREATE OR REPLACE FUNCTION print_last_query(query text)
+RETURNS TABLE(query_status text) AS $$
+    SELECT query_status
+    FROM gpsc.log
+    WHERE segid = -1 AND query_text = query
+    ORDER BY ccnt DESC
+$$ LANGUAGE sql;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.logging_mode TO 'TBL';
+-- SET below disables utility logging and DONE must still be logged.
+SET gpsc.enable_utility TO FALSE;
+SELECT * FROM print_last_query('SET gpsc.enable_utility TO FALSE;');
+    query_status     
+---------------------
+ QUERY_STATUS_SUBMIT
+ QUERY_STATUS_DONE
+(2 rows)
+
+-- SELECT below adds current user to ignore list and DONE must still be logged.
+-- start_ignore
+SELECT set_config('gpsc.ignored_users_list', current_user, false);
+ set_config 
+------------
+ gpadmin
+(1 row)
+
+-- end_ignore
+SELECT * FROM print_last_query('SELECT set_config(''gpsc.ignored_users_list'', current_user, false);');
+    query_status     
+---------------------
+ QUERY_STATUS_SUBMIT
+ QUERY_STATUS_START
+ QUERY_STATUS_END
+ QUERY_STATUS_DONE
+(4 rows)
+
+DROP FUNCTION print_last_query(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
+RESET gpsc.logging_mode;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_locale.out b/gpcontrib/gp_stats_collector/expected/gpsc_locale.out
new file mode 100644
index 00000000000..a01fe0648b9
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_locale.out
@@ -0,0 +1,23 @@
+-- The extension generates normalized query text and plan using jumbling functions.
+-- Those functions may fail when translating to wide character if the current locale
+-- cannot handle the character set. This test checks that even when those functions
+-- fail, the plan is still generated and executed. This test is partially taken from
+-- gp_locale.
+-- start_ignore
+DROP DATABASE IF EXISTS gpsc_test_locale;
+-- end_ignore
+CREATE DATABASE gpsc_test_locale WITH LC_COLLATE='C' LC_CTYPE='C' TEMPLATE=template0;
+\c gpsc_test_locale
+CREATE EXTENSION gp_stats_collector;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.enable TO TRUE;
+CREATE TABLE gpsc_hi_안녕세계 (a int, 안녕세계1 text, 안녕세계2 text, 안녕세계3 text) DISTRIBUTED BY (a);
+INSERT INTO gpsc_hi_안녕세계 VALUES(1, '안녕세계1 first', '안녕세2 first', '안녕세계3 first');
+-- Should not see error here
+UPDATE gpsc_hi_안녕세계 SET 안녕세계1='안녕세계1 first UPDATE' WHERE 안녕세계1='안녕세계1 first';
+RESET gpsc.enable;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
+DROP TABLE gpsc_hi_안녕세계;
+DROP EXTENSION gp_stats_collector;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_select.out b/gpcontrib/gp_stats_collector/expected/gpsc_select.out
new file mode 100644
index 00000000000..3008c8f6d55
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_select.out
@@ -0,0 +1,136 @@
+CREATE EXTENSION gp_stats_collector;
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+SET gpsc.enable_utility TO FALSE;
+-- Basic SELECT tests
+SET gpsc.logging_mode to 'TBL';
+SELECT 1;
+ ?column? 
+----------
+        1
+(1 row)
+
+SELECT COUNT(*) FROM generate_series(1,10);
+ count 
+-------
+    10
+(1 row)
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                 query_text                  |    query_status     
+-------+---------------------------------------------+---------------------
+    -1 | SELECT 1;                                   | QUERY_STATUS_SUBMIT
+    -1 | SELECT 1;                                   | QUERY_STATUS_START
+    -1 | SELECT 1;                                   | QUERY_STATUS_END
+    -1 | SELECT 1;                                   | QUERY_STATUS_DONE
+    -1 | SELECT COUNT(*) FROM generate_series(1,10); | QUERY_STATUS_SUBMIT
+    -1 | SELECT COUNT(*) FROM generate_series(1,10); | QUERY_STATUS_START
+    -1 | SELECT COUNT(*) FROM generate_series(1,10); | QUERY_STATUS_END
+    -1 | SELECT COUNT(*) FROM generate_series(1,10); | QUERY_STATUS_DONE
+(8 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Transaction test
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+SELECT 1;
+ ?column? 
+----------
+        1
+(1 row)
+
+COMMIT;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid | query_text |    query_status     
+-------+------------+---------------------
+    -1 | SELECT 1;  | QUERY_STATUS_SUBMIT
+    -1 | SELECT 1;  | QUERY_STATUS_START
+    -1 | SELECT 1;  | QUERY_STATUS_END
+    -1 | SELECT 1;  | QUERY_STATUS_DONE
+(4 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- CTE test
+SET gpsc.logging_mode to 'TBL';
+WITH t AS (VALUES (1), (2))
+SELECT * FROM t;
+ column1 
+---------
+       1
+       2
+(2 rows)
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |         query_text          |    query_status     
+-------+-----------------------------+---------------------
+    -1 | WITH t AS (VALUES (1), (2))+| QUERY_STATUS_SUBMIT
+       | SELECT * FROM t;            | 
+    -1 | WITH t AS (VALUES (1), (2))+| QUERY_STATUS_START
+       | SELECT * FROM t;            | 
+    -1 | WITH t AS (VALUES (1), (2))+| QUERY_STATUS_END
+       | SELECT * FROM t;            | 
+    -1 | WITH t AS (VALUES (1), (2))+| QUERY_STATUS_DONE
+       | SELECT * FROM t;            | 
+(4 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Prepared statement test
+SET gpsc.logging_mode to 'TBL';
+PREPARE test_stmt AS SELECT 1;
+EXECUTE test_stmt;
+ ?column? 
+----------
+        1
+(1 row)
+
+DEALLOCATE test_stmt;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |           query_text           |    query_status     
+-------+--------------------------------+---------------------
+    -1 | PREPARE test_stmt AS SELECT 1; | QUERY_STATUS_SUBMIT
+    -1 | PREPARE test_stmt AS SELECT 1; | QUERY_STATUS_START
+    -1 | PREPARE test_stmt AS SELECT 1; | QUERY_STATUS_END
+    -1 | PREPARE test_stmt AS SELECT 1; | QUERY_STATUS_DONE
+(4 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_uds.out b/gpcontrib/gp_stats_collector/expected/gpsc_uds.out
new file mode 100644
index 00000000000..e8bca79e669
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_uds.out
@@ -0,0 +1,42 @@
+-- Test UDS socket
+-- start_ignore
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+-- end_ignore
+\set UDS_PATH '/tmp/gpsc_test.sock'
+-- Configure extension to send via UDS
+SET gpsc.uds_path TO :'UDS_PATH';
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.logging_mode TO 'UDS';
+-- Start receiver
+SELECT gpsc.__test_uds_start_server(:'UDS_PATH');
+ __test_uds_start_server 
+-------------------------
+(0 rows)
+
+-- Send
+SELECT 1;
+ ?column? 
+----------
+        1
+(1 row)
+
+-- Receive
+SELECT gpsc.__test_uds_receive() > 0 as received;
+ received 
+----------
+ t
+(1 row)
+
+-- Stop receiver
+SELECT gpsc.__test_uds_stop_server();
+ __test_uds_stop_server 
+------------------------
+(0 rows)
+
+-- Cleanup
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.uds_path;
+RESET gpsc.ignored_users_list;
+RESET gpsc.enable;
+RESET gpsc.logging_mode;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_utf8_trim.out b/gpcontrib/gp_stats_collector/expected/gpsc_utf8_trim.out
new file mode 100644
index 00000000000..db3949f3152
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_utf8_trim.out
@@ -0,0 +1,68 @@
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+CREATE OR REPLACE FUNCTION get_marked_query(marker TEXT)
+RETURNS TEXT AS $$
+    SELECT query_text
+    FROM gpsc.log
+    WHERE query_text LIKE '%' || marker || '%'
+    ORDER BY datetime DESC
+    LIMIT 1
+$$ LANGUAGE sql VOLATILE;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+-- Test 1: 1 byte chars
+SET gpsc.max_text_size to 19;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test1*/ 'HelloWorld';
+  ?column?  
+------------
+ HelloWorld
+(1 row)
+
+RESET gpsc.logging_mode;
+SELECT octet_length(get_marked_query('test1')) = 19 AS correct_length;
+ correct_length 
+----------------
+ t
+(1 row)
+
+-- Test 2: 2 byte chars
+SET gpsc.max_text_size to 19;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test2*/ 'РУССКИЙЯЗЫК';
+  ?column?   
+-------------
+ РУССКИЙЯЗЫК
+(1 row)
+
+RESET gpsc.logging_mode;
+-- Character 'Р' has two bytes and cut in the middle => not included.
+SELECT octet_length(get_marked_query('test2')) = 18 AS correct_length;
+ correct_length 
+----------------
+ t
+(1 row)
+
+-- Test 3: 4 byte chars
+SET gpsc.max_text_size to 21;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test3*/ '😀';
+ ?column? 
+----------
+ 😀
+(1 row)
+
+RESET gpsc.logging_mode;
+-- Emoji has 4 bytes and cut before the last byte => not included.
+SELECT octet_length(get_marked_query('test3')) = 18 AS correct_length;
+ correct_length 
+----------------
+ t
+(1 row)
+
+-- Cleanup
+DROP FUNCTION get_marked_query(TEXT);
+RESET gpsc.max_text_size;
+RESET gpsc.logging_mode;
+RESET gpsc.enable;
+RESET gpsc.ignored_users_list;
+DROP EXTENSION gp_stats_collector;
diff --git a/gpcontrib/gp_stats_collector/expected/gpsc_utility.out b/gpcontrib/gp_stats_collector/expected/gpsc_utility.out
new file mode 100644
index 00000000000..e8e28614370
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/expected/gpsc_utility.out
@@ -0,0 +1,248 @@
+CREATE EXTENSION gp_stats_collector;
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+SET gpsc.logging_mode to 'TBL';
+CREATE TABLE test_table (a int, b text);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+CREATE INDEX test_idx ON test_table(a);
+ALTER TABLE test_table ADD COLUMN c int DEFAULT 1;
+DROP TABLE test_table;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                     query_text                     |    query_status     
+-------+----------------------------------------------------+---------------------
+    -1 | CREATE TABLE test_table (a int, b text);           | QUERY_STATUS_SUBMIT
+    -1 | CREATE TABLE test_table (a int, b text);           | QUERY_STATUS_DONE
+    -1 | CREATE INDEX test_idx ON test_table(a);            | QUERY_STATUS_SUBMIT
+    -1 | CREATE INDEX test_idx ON test_table(a);            | QUERY_STATUS_DONE
+    -1 | ALTER TABLE test_table ADD COLUMN c int DEFAULT 1; | QUERY_STATUS_SUBMIT
+    -1 | ALTER TABLE test_table ADD COLUMN c int DEFAULT 1; | QUERY_STATUS_DONE
+    -1 | DROP TABLE test_table;                             | QUERY_STATUS_SUBMIT
+    -1 | DROP TABLE test_table;                             | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                           | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                           | QUERY_STATUS_DONE
+(10 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Partitioning
+SET gpsc.logging_mode to 'TBL';
+CREATE TABLE pt_test (a int, b int)
+DISTRIBUTED BY (a)
+PARTITION BY RANGE (a)
+(START (0) END (100) EVERY (50));
+DROP TABLE pt_test;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |             query_text              |    query_status     
+-------+-------------------------------------+---------------------
+    -1 | CREATE TABLE pt_test (a int, b int)+| QUERY_STATUS_SUBMIT
+       | DISTRIBUTED BY (a)                 +| 
+       | PARTITION BY RANGE (a)             +| 
+       | (START (0) END (100) EVERY (50));   | 
+    -1 | CREATE TABLE pt_test (a int, b int)+| QUERY_STATUS_DONE
+       | DISTRIBUTED BY (a)                 +| 
+       | PARTITION BY RANGE (a)             +| 
+       | (START (0) END (100) EVERY (50));   | 
+    -1 | DROP TABLE pt_test;                 | QUERY_STATUS_SUBMIT
+    -1 | DROP TABLE pt_test;                 | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;            | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;            | QUERY_STATUS_DONE
+(6 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Views and Functions
+SET gpsc.logging_mode to 'TBL';
+CREATE VIEW test_view AS SELECT 1 AS a;
+CREATE FUNCTION test_func(i int) RETURNS int AS $$ SELECT $1 + 1; $$ LANGUAGE SQL;
+DROP VIEW test_view;
+DROP FUNCTION test_func(int);
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                                     query_text                                     |    query_status     
+-------+------------------------------------------------------------------------------------+---------------------
+    -1 | CREATE VIEW test_view AS SELECT 1 AS a;                                            | QUERY_STATUS_SUBMIT
+    -1 | CREATE VIEW test_view AS SELECT 1 AS a;                                            | QUERY_STATUS_DONE
+    -1 | CREATE FUNCTION test_func(i int) RETURNS int AS $$ SELECT $1 + 1; $$ LANGUAGE SQL; | QUERY_STATUS_SUBMIT
+    -1 | CREATE FUNCTION test_func(i int) RETURNS int AS $$ SELECT $1 + 1; $$ LANGUAGE SQL; | QUERY_STATUS_DONE
+    -1 | DROP VIEW test_view;                                                               | QUERY_STATUS_SUBMIT
+    -1 | DROP VIEW test_view;                                                               | QUERY_STATUS_DONE
+    -1 | DROP FUNCTION test_func(int);                                                      | QUERY_STATUS_SUBMIT
+    -1 | DROP FUNCTION test_func(int);                                                      | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                                                           | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                                                           | QUERY_STATUS_DONE
+(10 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Transaction Operations
+SET gpsc.logging_mode to 'TBL';
+BEGIN;
+SAVEPOINT sp1;
+ROLLBACK TO sp1;
+COMMIT;
+BEGIN;
+SAVEPOINT sp2;
+ABORT;
+BEGIN;
+ROLLBACK;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |        query_text        |    query_status     
+-------+--------------------------+---------------------
+    -1 | BEGIN;                   | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                   | QUERY_STATUS_DONE
+    -1 | SAVEPOINT sp1;           | QUERY_STATUS_SUBMIT
+    -1 | ROLLBACK TO sp1;         | QUERY_STATUS_SUBMIT
+    -1 | ROLLBACK TO sp1;         | QUERY_STATUS_DONE
+    -1 | COMMIT;                  | QUERY_STATUS_SUBMIT
+    -1 | COMMIT;                  | QUERY_STATUS_DONE
+    -1 | BEGIN;                   | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                   | QUERY_STATUS_DONE
+    -1 | SAVEPOINT sp2;           | QUERY_STATUS_SUBMIT
+    -1 | ABORT;                   | QUERY_STATUS_SUBMIT
+    -1 | ABORT;                   | QUERY_STATUS_DONE
+    -1 | BEGIN;                   | QUERY_STATUS_SUBMIT
+    -1 | BEGIN;                   | QUERY_STATUS_DONE
+    -1 | ROLLBACK;                | QUERY_STATUS_SUBMIT
+    -1 | ROLLBACK;                | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode; | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode; | QUERY_STATUS_DONE
+(18 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- DML Operations
+SET gpsc.logging_mode to 'TBL';
+CREATE TABLE dml_test (a int, b text);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+INSERT INTO dml_test VALUES (1, 'test');
+UPDATE dml_test SET b = 'updated' WHERE a = 1;
+DELETE FROM dml_test WHERE a = 1;
+DROP TABLE dml_test;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |               query_text               |    query_status     
+-------+----------------------------------------+---------------------
+    -1 | CREATE TABLE dml_test (a int, b text); | QUERY_STATUS_SUBMIT
+    -1 | CREATE TABLE dml_test (a int, b text); | QUERY_STATUS_DONE
+    -1 | DROP TABLE dml_test;                   | QUERY_STATUS_SUBMIT
+    -1 | DROP TABLE dml_test;                   | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;               | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;               | QUERY_STATUS_DONE
+(6 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- COPY Operations
+SET gpsc.logging_mode to 'TBL';
+CREATE TABLE copy_test (a int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+COPY (SELECT 1) TO STDOUT;
+1
+DROP TABLE copy_test;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |           query_text            |    query_status     
+-------+---------------------------------+---------------------
+    -1 | CREATE TABLE copy_test (a int); | QUERY_STATUS_SUBMIT
+    -1 | CREATE TABLE copy_test (a int); | QUERY_STATUS_DONE
+    -1 | COPY (SELECT 1) TO STDOUT;      | QUERY_STATUS_SUBMIT
+    -1 | COPY (SELECT 1) TO STDOUT;      | QUERY_STATUS_DONE
+    -1 | DROP TABLE copy_test;           | QUERY_STATUS_SUBMIT
+    -1 | DROP TABLE copy_test;           | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;        | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;        | QUERY_STATUS_DONE
+(8 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- Prepared Statements and error during execute
+SET gpsc.logging_mode to 'TBL';
+PREPARE test_prep(int) AS SELECT $1/0 AS value;
+EXECUTE test_prep(0::int);
+ERROR:  division by zero
+DEALLOCATE test_prep;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                   query_text                    |    query_status     
+-------+-------------------------------------------------+---------------------
+    -1 | PREPARE test_prep(int) AS SELECT $1/0 AS value; | QUERY_STATUS_SUBMIT
+    -1 | PREPARE test_prep(int) AS SELECT $1/0 AS value; | QUERY_STATUS_DONE
+    -1 | EXECUTE test_prep(0::int);                      | QUERY_STATUS_SUBMIT
+    -1 | EXECUTE test_prep(0::int);                      | QUERY_STATUS_ERROR
+    -1 | DEALLOCATE test_prep;                           | QUERY_STATUS_SUBMIT
+    -1 | DEALLOCATE test_prep;                           | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                        | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                        | QUERY_STATUS_DONE
+(8 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+-- GUC Settings
+SET gpsc.logging_mode to 'TBL';
+SET gpsc.report_nested_queries TO FALSE;
+RESET gpsc.report_nested_queries;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+ segid |                query_text                |    query_status     
+-------+------------------------------------------+---------------------
+    -1 | SET gpsc.report_nested_queries TO FALSE; | QUERY_STATUS_SUBMIT
+    -1 | SET gpsc.report_nested_queries TO FALSE; | QUERY_STATUS_DONE
+    -1 | RESET gpsc.report_nested_queries;        | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.report_nested_queries;        | QUERY_STATUS_DONE
+    -1 | RESET gpsc.logging_mode;                 | QUERY_STATUS_SUBMIT
+    -1 | RESET gpsc.logging_mode;                 | QUERY_STATUS_DONE
+(6 rows)
+
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+ t 
+---
+(0 rows)
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/gp_stats_collector--1.0--1.1.sql b/gpcontrib/gp_stats_collector/gp_stats_collector--1.0--1.1.sql
new file mode 100644
index 00000000000..398f03b4fa9
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/gp_stats_collector--1.0--1.1.sql
@@ -0,0 +1,137 @@
+/* gp_stats_collector--1.0--1.1.sql */
+
+-- complain if script is sourced in psql, rather than via ALTER EXTENSION
+\echo Use "ALTER EXTENSION gp_stats_collector UPDATE TO '1.1'" to load this file. \quit
+
+-- Upgrade 1.0 -> 1.1: the 1.0 objects are replaced by equivalents inside the
+-- new "gpsc" schema, and the objects introduced by 1.1 are created. The end
+-- state must match a fresh install from gp_stats_collector--1.1.sql.
+CREATE SCHEMA gpsc;
+
+-- Unlink existing objects from extension.
+ALTER EXTENSION gp_stats_collector DROP VIEW gpsc_stat_messages;
+ALTER EXTENSION gp_stats_collector DROP FUNCTION gpsc_stat_messages_reset();
+ALTER EXTENSION gp_stats_collector DROP FUNCTION __gpsc_stat_messages_f_on_segments();
+ALTER EXTENSION gp_stats_collector DROP FUNCTION __gpsc_stat_messages_f_on_master();
+ALTER EXTENSION gp_stats_collector DROP FUNCTION __gpsc_stat_messages_reset_f_on_segments();
+ALTER EXTENSION gp_stats_collector DROP FUNCTION __gpsc_stat_messages_reset_f_on_master();
+
+-- Now drop the objects.
+DROP VIEW gpsc_stat_messages;
+DROP FUNCTION gpsc_stat_messages_reset();
+DROP FUNCTION __gpsc_stat_messages_f_on_segments();
+DROP FUNCTION __gpsc_stat_messages_f_on_master();
+DROP FUNCTION __gpsc_stat_messages_reset_f_on_segments();
+DROP FUNCTION __gpsc_stat_messages_reset_f_on_master();
+
+-- Recreate functions and view in new schema.
+CREATE FUNCTION gpsc.__stat_messages_reset_f_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_reset_f_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON ALL SEGMENTS;
+
+-- Wrapper: runs the coordinator variant, then the segment variant.
+CREATE FUNCTION gpsc.stat_messages_reset()
+  RETURNS SETOF void
+  AS
+$$
+  SELECT gpsc.__stat_messages_reset_f_on_master();
+  SELECT gpsc.__stat_messages_reset_f_on_segments();
+$$
+  LANGUAGE SQL EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_f_on_master()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_f_on_segments()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Message counters from the coordinator and from all segments, ordered by segid.
+CREATE VIEW gpsc.stat_messages AS
+  SELECT C.*
+  FROM gpsc.__stat_messages_f_on_master() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+  UNION ALL
+  SELECT C.*
+  FROM gpsc.__stat_messages_f_on_segments() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+ORDER BY segid;
+
+-- Create new objects.
+CREATE FUNCTION gpsc.__init_log_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_init_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__init_log_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_init_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Creates log table inside gpsc schema.
+SELECT gpsc.__init_log_on_master();
+SELECT gpsc.__init_log_on_segments();
+
+-- Rows of gpsc.__log from the coordinator together with the rows from the segments.
+CREATE VIEW gpsc.log AS
+  SELECT * FROM gpsc.__log -- master
+  UNION ALL
+  SELECT * FROM gp_dist_random('gpsc.__log') -- segments
+ORDER BY tmid, ssid, ccnt;
+
+CREATE FUNCTION gpsc.__truncate_log_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_truncate_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__truncate_log_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_truncate_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Wrapper: runs the coordinator variant, then the segment variant.
+CREATE FUNCTION gpsc.truncate_log()
+  RETURNS SETOF void AS $$
+BEGIN
+    PERFORM gpsc.__truncate_log_on_master();
+    PERFORM gpsc.__truncate_log_on_segments();
+END;
+$$ LANGUAGE plpgsql VOLATILE;
+
+-- UDS test helpers. A fresh 1.1 install creates them, so the upgrade path must
+-- create them too; otherwise the two install paths end with different objects.
+CREATE FUNCTION gpsc.__test_uds_start_server(path text)
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_start_server'
+  LANGUAGE C STRICT EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__test_uds_receive(timeout_ms int DEFAULT 2000)
+  RETURNS SETOF bigint
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_receive'
+  LANGUAGE C STRICT EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__test_uds_stop_server()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_stop_server'
+  LANGUAGE C EXECUTE ON COORDINATOR;
diff --git a/gpcontrib/gp_stats_collector/gp_stats_collector--1.0.sql b/gpcontrib/gp_stats_collector/gp_stats_collector--1.0.sql
new file mode 100644
index 00000000000..e4a50aa2133
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/gp_stats_collector--1.0.sql
@@ -0,0 +1,59 @@
+/* gp_stats_collector--1.0.sql */
+
+-- complain if script is sourced in psql, rather than via CREATE EXTENSION
+\echo Use "CREATE EXTENSION gp_stats_collector" to load this file. \quit
+
+-- Each *_f_on_master / *_f_on_segments pair binds the same C symbol; the two
+-- functions differ only in where they execute (EXECUTE ON clause).
+CREATE FUNCTION __gpsc_stat_messages_reset_f_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION __gpsc_stat_messages_reset_f_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON ALL SEGMENTS;
+
+-- Wrapper: runs the coordinator variant, then the segment variant.
+CREATE FUNCTION gpsc_stat_messages_reset()
+  RETURNS SETOF void
+  AS
+$$
+  SELECT __gpsc_stat_messages_reset_f_on_master();
+  SELECT __gpsc_stat_messages_reset_f_on_segments();
+$$
+  LANGUAGE SQL EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION __gpsc_stat_messages_f_on_master()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION __gpsc_stat_messages_f_on_segments()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Message counters from the coordinator and from all segments, ordered by segid.
+CREATE VIEW gpsc_stat_messages AS
+  SELECT C.*
+  FROM __gpsc_stat_messages_f_on_master() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+  UNION ALL
+  SELECT C.*
+  FROM __gpsc_stat_messages_f_on_segments() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+ORDER BY segid;
diff --git a/gpcontrib/gp_stats_collector/gp_stats_collector--1.1.sql b/gpcontrib/gp_stats_collector/gp_stats_collector--1.1.sql
new file mode 100644
index 00000000000..3ebdad14b06
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/gp_stats_collector--1.1.sql
@@ -0,0 +1,119 @@
+/* gp_stats_collector--1.1.sql */
+
+-- complain if script is sourced in psql, rather than via CREATE EXTENSION
+\echo Use "CREATE EXTENSION gp_stats_collector" to load this file. \quit
+
+-- Every object below is created inside the dedicated "gpsc" schema.
+CREATE SCHEMA gpsc;
+
+-- Each *_on_master / *_on_segments pair binds the same C symbol; the two
+-- functions differ only in where they execute (EXECUTE ON clause).
+CREATE FUNCTION gpsc.__stat_messages_reset_f_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_reset_f_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages_reset'
+  LANGUAGE C EXECUTE ON ALL SEGMENTS;
+
+-- Wrapper: runs the coordinator variant, then the segment variant.
+CREATE FUNCTION gpsc.stat_messages_reset()
+  RETURNS SETOF void
+  AS
+$$
+  SELECT gpsc.__stat_messages_reset_f_on_master();
+  SELECT gpsc.__stat_messages_reset_f_on_segments();
+$$
+  LANGUAGE SQL EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_f_on_master()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__stat_messages_f_on_segments()
+  RETURNS SETOF record
+  AS 'MODULE_PATHNAME', 'gpsc_stat_messages'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Message counters from the coordinator and from all segments, ordered by segid.
+CREATE VIEW gpsc.stat_messages AS
+  SELECT C.*
+  FROM gpsc.__stat_messages_f_on_master() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+  UNION ALL
+  SELECT C.*
+  FROM gpsc.__stat_messages_f_on_segments() AS C (
+    segid int,
+    total_messages bigint,
+    send_failures bigint,
+    connection_failures bigint,
+    other_errors bigint,
+    max_message_size int
+  )
+ORDER BY segid;
+
+CREATE FUNCTION gpsc.__init_log_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_init_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__init_log_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_init_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Creates log table inside gpsc schema.
+SELECT gpsc.__init_log_on_master();
+SELECT gpsc.__init_log_on_segments();
+
+-- Rows of gpsc.__log from the coordinator together with the rows from the segments.
+CREATE VIEW gpsc.log AS
+  SELECT * FROM gpsc.__log -- master
+  UNION ALL
+  SELECT * FROM gp_dist_random('gpsc.__log') -- segments
+ORDER BY tmid, ssid, ccnt;
+
+CREATE FUNCTION gpsc.__truncate_log_on_master()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_truncate_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__truncate_log_on_segments()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_truncate_log'
+  LANGUAGE C STRICT VOLATILE EXECUTE ON ALL SEGMENTS;
+
+-- Wrapper: runs the coordinator variant, then the segment variant.
+CREATE FUNCTION gpsc.truncate_log()
+  RETURNS SETOF void AS $$
+BEGIN
+    PERFORM gpsc.__truncate_log_on_master();
+    PERFORM gpsc.__truncate_log_on_segments();
+END;
+$$ LANGUAGE plpgsql VOLATILE;
+
+-- Helpers driven by the gpsc_uds regression test: start a UDS receiver,
+-- receive from it (timeout_ms defaults to 2000), and stop it.
+CREATE FUNCTION gpsc.__test_uds_start_server(path text)
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_start_server'
+  LANGUAGE C STRICT EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__test_uds_receive(timeout_ms int DEFAULT 2000)
+  RETURNS SETOF bigint
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_receive'
+  LANGUAGE C STRICT EXECUTE ON COORDINATOR;
+
+CREATE FUNCTION gpsc.__test_uds_stop_server()
+  RETURNS SETOF void
+  AS 'MODULE_PATHNAME', 'gpsc_test_uds_stop_server'
+  LANGUAGE C EXECUTE ON COORDINATOR;
diff --git a/gpcontrib/gp_stats_collector/gp_stats_collector.control b/gpcontrib/gp_stats_collector/gp_stats_collector.control
new file mode 100644
index 00000000000..4aea2bd49b8
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/gp_stats_collector.control
@@ -0,0 +1,5 @@
+# gp_stats_collector extension
+comment = 'Intercept query and plan execution hooks and report them to Cloudberry monitor agents'
+default_version = '1.1'
+module_pathname = '$libdir/gp_stats_collector'
+superuser = true
diff --git a/gpcontrib/gp_stats_collector/metric.md b/gpcontrib/gp_stats_collector/metric.md
new file mode 100644
index 00000000000..6f168d8cd98
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/metric.md
@@ -0,0 +1,145 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one
+  or more contributor license agreements.  See the NOTICE file
+  distributed with this work for additional information
+  regarding copyright ownership.  The ASF licenses this file
+  to you under the Apache License, Version 2.0 (the
+  "License"); you may not use this file except in compliance
+  with the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing,
+  software distributed under the License is distributed on an
+  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  KIND, either express or implied.  See the License for the
+  specific language governing permissions and limitations
+  under the License.
+-->
+
+## GP Stats Collector Metrics
+
+### States
+A Postgres process goes through 4 executor functions to execute a query:
+1) `ExecutorStart()` - resource allocation for the query.
+2) `ExecutorRun()` - query execution.
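+3) `ExecutorFinish()` - post-execution work that must complete before shutdown (e.g. firing queued AFTER triggers).
+4) `ExecutorEnd()` - cleanup and release of the query's resources.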
+
+gp-stats-collector sends messages with 4 states, from _Dispatcher_ and/or _Execute_ processes: `submit`, `start`, `end`, `done`, in this order:
+```
+submit -> ExecutorStart() -> start -> ExecutorRun() -> ExecutorFinish() -> end -> ExecutorEnd() -> done
+```
+
+### Key Points
+- Some queries may skip the _end_ state; in that case the _end_ statistics are sent with _done_.
+- If a query finishes with an error (`METRICS_QUERY_ERROR`) or is cancelled (`METRICS_QUERY_CANCELLED`), the statistics are sent at _done_.
+- Some statistics are calculated as the difference between the current value of a global metric and its value at _submit_: the initial snapshot is taken at _submit_, and the diff is calculated at _end_/_done_.
+- Nested queries on _Dispatcher_ become top-level on _Execute_.
+- Each process (_Dispatcher_/_Execute_) sends its own statistics.
+
+### Notations
+- **S** = Submit event.
+- **T** = Start event.
+- **E** = End event.
+- **D** = Done event.
+- **DIFF** = current_value - submit_value (submit event).
+- **ABS** = Absolute value, or where diff is not applicable, the value taken.
+- **Local\*** - Statistics that start counting from zero for each new query. A nested query is also considered new.
+- **Node** - PG process, either a `Query Dispatcher` (on master) or an `Execute` (on segment).
+
+### Statistics Table
+
+| Proto Field                  | Type   | When    | DIFF/ABS | Local* | Scope   | Dispatcher | Execute | Units   | Notes                                               |
+| :--------------------------- | :----- | :------ | :------- | ------ | :------ | :--------: | :-----: | :------ | :-------------------------------------------------- |
+| **SystemStat**               |        |         |          |        |         |            |         |         |                                                     |
+| `runningTimeSeconds`         | double | E, D    | DIFF     | -      | Node    |     +      |    +    | seconds | Wall clock time                                     |
+| `userTimeSeconds`            | double | E, D    | DIFF     | -      | Node    |     +      |    +    | seconds | /proc/pid/stat utime                                |
+| `kernelTimeSeconds`          | double | E, D    | DIFF     | -      | Node    |     +      |    +    | seconds | /proc/pid/stat stime                                |
+| `vsize`                      | uint64 | E, D    | ABS      | -      | Node    |     +      |    +    | bytes   | /proc/pid/stat vsize                                |
+| `rss`                        | uint64 | E, D    | ABS      | -      | Node    |     +      |    +    | pages   | /proc/pid/stat rss                                  |
+| `VmSizeKb`                   | uint64 | E, D    | ABS      | -      | Node    |     +      |    +    | KB      | /proc/pid/status VmSize                             |
+| `VmPeakKb`                   | uint64 | E, D    | ABS      | -      | Node    |     +      |    +    | KB      | /proc/pid/status VmPeak                             |
+| `rchar`                      | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | /proc/pid/io rchar                                  |
+| `wchar`                      | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | /proc/pid/io wchar                                  |
+| `syscr`                      | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | count   | /proc/pid/io syscr                                  |
+| `syscw`                      | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | count   | /proc/pid/io syscw                                  |
+| `read_bytes`                 | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | /proc/pid/io read_bytes                             |
+| `write_bytes`                | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | /proc/pid/io write_bytes                            |
+| `cancelled_write_bytes`      | uint64 | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | /proc/pid/io cancelled_write_bytes                  |
+| **MetricInstrumentation**    |        |         |          |        |         |            |         |         |                                                     |
+| `ntuples`                    | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | tuples  | Accumulated total tuples                            |
+| `nloops`                     | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | count   | Number of cycles                                    |
+| `tuplecount`                 | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | tuples  | Accumulated tuples per cycle                        |
+| `firsttuple`                 | double | E, D    | ABS      | +      | Node    |     +      |    +    | seconds | Time for first tuple of this cycle                  |
+| `startup`                    | double | E, D    | ABS      | +      | Node    |     +      |    +    | seconds | Start time of current iteration                     |
+| `total`                      | double | E, D    | ABS      | +      | Node    |     +      |    +    | seconds | Total time taken                                    |
+| `shared_blks_hit`            | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Shared buffer blocks found in cache                 |
+| `shared_blks_read`           | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Shared buffer blocks read from disk                 |
+| `shared_blks_dirtied`        | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Shared blocks dirtied                               |
+| `shared_blks_written`        | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Dirty shared buffer blocks written to disk          |
+| `local_blks_hit`             | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Local buffer hits                                   |
+| `local_blks_read`            | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Disk blocks read                                    |
+| `local_blks_dirtied`         | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Local blocks dirtied                                |
+| `local_blks_written`         | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Local blocks written to disk                        |
+| `temp_blks_read`             | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Temp file blocks read                               |
+| `temp_blks_written`          | uint64 | E, D    | ABS      | +      | Node    |     +      |    +    | blocks  | Temp file blocks written                            |
+| `blk_read_time`              | double | E, D    | ABS      | +      | Node    |     +      |    +    | seconds | Time reading data blocks                            |
+| `blk_write_time`             | double | E, D    | ABS      | +      | Node    |     +      |    +    | seconds | Time writing data blocks                            |
+| `inherited_calls`            | uint64 | E, D    | ABS      | -      | Node    |     +      |    +    | count   | Nested query count (GPSC-specific)                  |
+| `inherited_time`             | double | E, D    | ABS      | -      | Node    |     +      |    +    | seconds | Nested query time (GPSC-specific)                   |
+| **NetworkStat (sent)**       |        |         |          |        |         |            |         |         |                                                     |
+| `sent.total_bytes`           | uint64 | D       | ABS      | -      | Node    |     +      |    +    | bytes   | Bytes sent, including headers                       |
+| `sent.tuple_bytes`           | uint64 | D       | ABS      | -      | Node    |     +      |    +    | bytes   | Bytes of pure tuple-data sent                       |
+| `sent.chunks`                | uint64 | D       | ABS      | -      | Node    |     +      |    +    | count   | Tuple-chunks sent                                   |
+| **NetworkStat (received)**   |        |         |          |        |         |            |         |         |                                                     |
+| `received.total_bytes`       | uint64 | D       | ABS      | -      | Node    |     +      |    +    | bytes   | Bytes received, including headers                   |
+| `received.tuple_bytes`       | uint64 | D       | ABS      | -      | Node    |     +      |    +    | bytes   | Bytes of pure tuple-data received                   |
+| `received.chunks`            | uint64 | D       | ABS      | -      | Node    |     +      |    +    | count   | Tuple-chunks received                               |
+| **InterconnectStat**         |        |         |          |        |         |            |         |         |                                                     |
+| `total_recv_queue_size`      | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | bytes   | Receive queue size sum                              |
+| `recv_queue_size_counting_time` | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | count   | Counting times when computing total_recv_queue_size |
+| `total_capacity`             | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | bytes   | the capacity sum for sent packets                   |
+| `capacity_counting_time`     | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | count   | counting times used to compute total_capacity       |
+| `total_buffers`              | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | count   | Available buffers                                   |
+| `buffer_counting_time`       | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | count   | counting times when compute total_buffers           |
+| `active_connections_num`     | uint64 | D       | DIFF     | -      | Node    |     +      |    +    | count   | Active connections                                  |
+| `retransmits`                | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Packet retransmits                                  |
+| `startup_cached_pkt_num`     | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Startup cached packets                              |
+| `mismatch_num`               | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Mismatched packets received                         |
+| `crc_errors`                 | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | CRC errors                                          |
+| `snd_pkt_num`                | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Packets sent                                        |
+| `recv_pkt_num`               | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Packets received                                    |
+| `disordered_pkt_num`         | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Out-of-order packets                                |
+| `duplicated_pkt_num`         | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Duplicate packets                                   |
+| `recv_ack_num`               | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | ACKs received                                       |
+| `status_query_msg_num`       | int64  | D       | DIFF     | -      | Node    |     +      |    +    | count   | Status query messages sent                          |
+| **SpillInfo**                |        |         |          |        |         |            |         |         |                                                     |
+| `fileCount`                  | int32  | E, D    | DIFF     | -      | Node    |     +      |    +    | count   | Spill (temp) files created                          |
+| `totalBytes`                 | int64  | E, D    | DIFF     | -      | Node    |     +      |    +    | bytes   | Spill bytes written                                 |
+| **QueryInfo**                |        |         |          |        |         |            |         |         |                                                     |
+| `generator`                  | enum   | T, E, D | ABS      | -      | Cluster |     +      |    -    | enum    | Planner/Optimizer                                   |
+| `query_id`                   | uint64 | T, E, D | ABS      | -      | Cluster |     +      |    -    | id      | Query ID                                            |
+| `plan_id`                    | uint64 | T, E, D | ABS      | -      | Cluster |     +      |    -    | id      | Hash of normalized plan                             |
+| `query_text`                 | string | S       | ABS      | -      | Cluster |     +      |    -    | text    | Query text                                          |
+| `plan_text`                  | string | T       | ABS      | -      | Cluster |     +      |    -    | text    | EXPLAIN text                                        |
+| `template_query_text`        | string | S       | ABS      | -      | Cluster |     +      |    -    | text    | Normalized query text                               |
+| `template_plan_text`         | string | T       | ABS      | -      | Cluster |     +      |    -    | text    | Normalized plan text                                |
+| `userName`                   | string | All     | ABS      | -      | Cluster |     +      |    -    | text    | Session user                                        |
+| `databaseName`               | string | All     | ABS      | -      | Cluster |     +      |    -    | text    | Database name                                       |
+| `rsgname`                    | string | All     | ABS      | -      | Cluster |     +      |    -    | text    | Resource group name                                 |
+| `analyze_text`               | string | D       | ABS      | -      | Cluster |     +      |    -    | text    | EXPLAIN ANALYZE text                                |
+| **AdditionalQueryInfo**      |        |         |          |        |         |            |         |         |                                                     |
+| `nested_level`               | int64  | All     | ABS      | -      | Node    |     +      |    +    | count   | Current nesting level                               |
+| `error_message`              | string | D       | ABS      | -      | Node    |     +      |    +    | text    | Error message                                       |
+| `slice_id`                   | int64  | All     | ABS      | -      | Node    |     +      |    +    | id      | Slice ID                                            |
+| **QueryKey**                 |        |         |          |        |         |            |         |         |                                                     |
+| `tmid`                       | int32  | All     | ABS      | -      | Node    |     +      |    +    | id      | Transaction start time                              |
+| `ssid`                       | int32  | All     | ABS      | -      | Node    |     +      |    +    | id      | Session ID                                          |
+| `ccnt`                       | int32  | All     | ABS      | -      | Node    |     +      |    +    | count   | Command counter                                     |
+| **SegmentKey**               |        |         |          |        |         |            |         |         |                                                     |
+| `dbid`                       | int32  | All     | ABS      | -      | Node    |     +      |    +    | id      | Database ID                                         |
+| `segindex`                   | int32  | All     | ABS      | -      | Node    |     +      |    +    | id      | Segment index (-1=coordinator)                      |
+
+---
+
diff --git a/gpcontrib/gp_stats_collector/protos/gpsc_metrics.proto b/gpcontrib/gp_stats_collector/protos/gpsc_metrics.proto
new file mode 100644
index 00000000000..10991301557
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/protos/gpsc_metrics.proto
@@ -0,0 +1,201 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+syntax = "proto3";
+
+package gpsc;
+
+enum QueryStatus { // Query status reported in SetQueryReq.query_status.
+    QUERY_STATUS_UNSPECIFIED = 0; // zero value, i.e. the proto3 default
+    QUERY_STATUS_SUBMIT = 1;
+    QUERY_STATUS_START = 2;
+    QUERY_STATUS_DONE = 3;
+    QUERY_STATUS_QUERY_DONE = 4; // NOTE(review): how this differs from DONE is not documented here
+    QUERY_STATUS_ERROR = 5;
+    QUERY_STATUS_CANCELLING = 6; // NOTE(review): "CANCELLING" vs "CANCELED" below are spelled inconsistently
+    QUERY_STATUS_CANCELED = 7;
+    QUERY_STATUS_END = 8;
+}
+
+enum PlanNodeStatus { // Status values for a plan node; not referenced elsewhere in this file.
+    PLAN_NODE_STATUS_UNSPECIFIED = 0; // zero value, i.e. the proto3 default
+    PLAN_NODE_STATUS_INITIALIZED = 1;
+    PLAN_NODE_STATUS_EXECUTING = 2;
+    PLAN_NODE_STATUS_FINISHED = 3;
+}
+
+message QueryInfo { // Query identity and texts; sent as SetQueryReq.query_info.
+    PlanGenerator generator = 1; // planner or optimizer, see PlanGenerator
+    uint64 query_id = 2; // query ID
+    uint64 plan_id = 3; // hash of the normalized plan
+    string query_text = 4; // query text
+    string plan_text = 5; // EXPLAIN text
+    string template_query_text = 6; // normalized query text
+    string template_plan_text = 7; // normalized plan text
+    string userName = 8; // session user
+    string databaseName = 9; // database name
+    string rsgname = 10; // resource group name
+    string analyze_text = 11; // EXPLAIN ANALYZE text
+}
+
+message AdditionalQueryInfo { // Extra per-query fields; sent as SetQueryReq.add_info.
+    int64 nested_level                    = 1; // current nesting level
+    string error_message                  = 2; // error message
+    int64 slice_id                        = 3; // slice ID
+}
+
+message AdditionalQueryStat { // NOTE(review): not referenced elsewhere in this file; confirm where it is used.
+    string error_message                  = 1; // same field name as AdditionalQueryInfo.error_message
+    repeated int64 slices                 = 2; // presumably slice IDs - TODO confirm
+}
+
+enum PlanGenerator // Which component produced the plan; used by QueryInfo.generator.
+{
+    PLAN_GENERATOR_UNSPECIFIED = 0;     /* zero value, i.e. the proto3 default */
+    PLAN_GENERATOR_PLANNER = 1;         /* plan produced by the planner */
+    PLAN_GENERATOR_OPTIMIZER = 2;       /* plan produced by the optimizer */
+}
+
+message GPMetrics { // Metrics bundle; sent as SetQueryReq.query_metrics.
+    SystemStat systemStat = 1; // CPU, memory and storage counters
+    MetricInstrumentation instrumentation = 2; // tuple, timing, buffer and network counters
+    SpillInfo spill = 3; // spill file count and bytes
+}
+
+message QueryKey { // (tmid, ssid, ccnt) triple shared by all records of one query.
+    int32 tmid = 1; /* A time identifier for a particular query. All records associated with the query will have the same tmid. */
+    int32 ssid = 2; /* The session id as shown by gp_session_id. All records associated with the query will have the same ssid. */
+    int32 ccnt = 3; /* The command number within this session as shown by gp_command_count. All records associated with the query will have the same ccnt. */
+}
+
+message SegmentKey { // Identifies the reporting database instance; sent as SetQueryReq.segment_key.
+    int32		dbid = 1;		/* the dbid of this database */
+    int32		segindex = 2;		/* content indicator: -1 for entry database,
+                                                 * 0, ..., n-1 for segment databases;
+                                                 * a primary and its mirror have the same segindex */
+}
+
+message SystemStat { // Process-level counters; embedded as GPMetrics.systemStat.
+    /* CPU stat */
+    double runningTimeSeconds = 1;
+    double userTimeSeconds = 2;
+    double kernelTimeSeconds = 3;
+
+    /* Memory stat */
+    uint64 vsize = 4;
+    uint64 rss = 5;
+    uint64 VmSizeKb = 6;
+    uint64 VmPeakKb = 7;
+
+    /* Storage stat */
+    uint64 rchar = 8;
+    uint64 wchar = 9;
+    uint64 syscr = 10;
+    uint64 syscw = 11;
+    uint64 read_bytes = 12; /* /proc/pid/io read_bytes */
+    uint64 write_bytes = 13; /* /proc/pid/io write_bytes */
+    uint64 cancelled_write_bytes = 14; /* /proc/pid/io cancelled_write_bytes */
+}
+
+message NetworkStat { // One traffic direction; used for MetricInstrumentation.sent and .received.
+    uint64 total_bytes  = 1; // bytes, including headers
+    uint64 tuple_bytes = 2; // bytes of pure tuple data
+    uint64 chunks = 3; // number of tuple chunks
+}
+
+message InterconnectStat { // Interconnect counters; embedded as MetricInstrumentation.interconnect.
+    // Receive queue size sum when main thread is trying to get a packet
+    uint64 total_recv_queue_size = 1;
+    // Counting times when computing total_recv_queue_size
+    uint64 recv_queue_size_counting_time = 2;
+
+    // The capacity sum when packets are tried to be sent
+    uint64 total_capacity = 3;
+    // Counting times used to compute total_capacity
+    uint64 capacity_counting_time = 4;
+
+    // Total buffers available when sending packets
+    uint64 total_buffers = 5;
+    // Counting times when computing total_buffers
+    uint64 buffer_counting_time = 6;
+
+    // The number of active connections
+    uint64 active_connections_num = 7;
+
+    // The number of packet retransmits
+    int64 retransmits = 8;
+
+    // The number of cached future packets
+    int64 startup_cached_pkt_num = 9;
+
+    // The number of mismatched packets received
+    int64 mismatch_num = 10;
+
+    // The number of crc errors
+    int64 crc_errors = 11;
+
+    // The number of packets sent by sender
+    int64 snd_pkt_num = 12;
+
+    // The number of packets received by receiver
+    int64 recv_pkt_num = 13;
+
+    // Disordered packet number
+    int64 disordered_pkt_num = 14;
+
+    // Duplicate packet number
+    int64 duplicated_pkt_num = 15;
+
+    // The number of Acks received
+    int64 recv_ack_num = 16;
+
+    // The number of status query messages sent
+    int64 status_query_msg_num = 17;
+}
+
+message MetricInstrumentation { // Execution counters; embedded as GPMetrics.instrumentation.
+    uint64  ntuples     = 1;    /* Total tuples produced */
+    uint64  nloops      = 2;    /* # of run cycles for this node */
+    uint64  tuplecount  = 3;    /* Tuples emitted so far this cycle */
+    double  firsttuple  = 4;    /* Time for first tuple of this cycle */
+    double  startup     = 5;    /* Total startup time (in seconds) (optimiser's cost estimation) */
+    double  total       = 6;    /* Total time (in seconds) */
+    uint64 shared_blks_hit     = 7; /* shared buffer block stats */
+    uint64 shared_blks_read    = 8;
+    uint64 shared_blks_dirtied = 9;
+    uint64 shared_blks_written = 10;
+    uint64 local_blks_hit      = 11; /* local buffer block stats */
+    uint64 local_blks_read     = 12;
+    uint64 local_blks_dirtied  = 13;
+    uint64 local_blks_written  = 14;
+    uint64 temp_blks_read      = 15; /* temp file block stats */
+    uint64 temp_blks_written   = 16;
+    double blk_read_time       = 17; /* measured read/write time (in seconds) */
+    double blk_write_time      = 18;
+    NetworkStat sent           = 19; /* network traffic sent */
+    NetworkStat received       = 20; /* network traffic received */
+    double  startup_time       = 21; /* real query startup time (planning + queue time) */
+    uint64  inherited_calls    = 22; /* the number of executed sub-queries */
+    double  inherited_time     = 23; /* total time spent on inherited execution */
+    InterconnectStat interconnect = 24; /* interconnect counters */
+}
+
+message SpillInfo { // Spill counters; embedded as GPMetrics.spill.
+    int32 fileCount = 1; // spill (temp) files created
+    int64 totalBytes = 2; // spill bytes written
+}
diff --git a/gpcontrib/gp_stats_collector/protos/gpsc_plan.proto b/gpcontrib/gp_stats_collector/protos/gpsc_plan.proto
new file mode 100644
index 00000000000..c1632478464
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/protos/gpsc_plan.proto
@@ -0,0 +1,586 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+syntax = "proto3";
+
+package gpsc;
+
+message MetricPlan { // One plan node; SetQueryReq.plan_tree is a repeated list of these.
+    GpdbNodeType   type = 1;
+
+    int32   plan_node_id = 2;
+    int32   parent_plan_node_id = 3; // Valid only for QueryInfoMetricQuerySubmit
+
+    double  startup_cost = 4;	/* cost expended before fetching any tuples */
+    double  total_cost = 5;	/* total cost (assuming all tuples fetched) */
+    double  plan_rows = 6;	/* number of rows plan is expected to emit */
+    int32   plan_width = 7;	/* average row width in bytes */
+
+    int32   arg1 = 8;  // for some nodes it's an additional operand type
+    int32   arg2 = 9;  // for some nodes it's an additional operand type
+
+    MetricMotionInfo motion_info = 10;
+    MetricRelationInfo relation_info = 11;
+    
+    string scan_index_name = 12;
+    ScanDirection scan_direction = 13;
+    MetricSliceInfo slice_info = 14;
+    string statement = 15;
+}
+
+message MetricMotionInfo { // Motion details of a plan node; embedded as MetricPlan.motion_info.
+    MotionType   type = 1;
+    bool         isBroadcast = 2;
+    CdbLocusType locusType = 3;
+
+    int32 sliceId = 4;
+    int32 parentSliceId = 5;
+}
+
+message MetricRelationInfo { // Relation details of a plan node; embedded as MetricPlan.relation_info.
+    int32   oid = 1; // NOTE(review): presumably a PostgreSQL OID (unsigned 32-bit); values above INT32_MAX would show as negative - confirm
+    string  name = 2;
+    string  schema = 3;
+    string  alias = 4;
+    int32   dynamicScanId = 5;
+}
+
+message MetricSliceInfo { // Slice details of a plan node; embedded as MetricPlan.slice_info.
+    int32       slice = 1;
+    int32       segments = 2;
+    GangType    gangType = 3; // see GangType
+    int32       gang = 4;
+}
+
+enum ScanDirection // Scan direction of a plan node; used by MetricPlan.scan_direction.
+{
+    SCAN_DIRECTION_UNSPECIFIED = 0; // zero value, i.e. the proto3 default
+    SCAN_DIRECTION_BACKWARD = 1;
+    SCAN_DIRECTION_FORWARD = 2;
+}
+
+/* GangType enumeration is used in several structures related to CDB
+ * slice plan support. In this file it is used by MetricSliceInfo.gangType.
+ */
+enum GangType
+{
+    GANG_TYPE_UNSPECIFIED = 0;       /* zero value, i.e. the proto3 default */
+    GANG_TYPE_UNALLOCATED = 1;       /* a root slice executed by the qDisp */
+    GANG_TYPE_ENTRYDB_READER = 2;    /* a 1-gang with read access to the entry db */
+    GANG_TYPE_SINGLETON_READER = 3;  /* a 1-gang to read the segment dbs */
+    GANG_TYPE_PRIMARY_READER = 4;    /* a 1-gang or N-gang to read the segment dbs */
+    GANG_TYPE_PRIMARY_WRITER = 5;    /* the N-gang that can update the segment dbs */
+}
+
+
+enum CdbLocusType // Locus of a motion's data; used by MetricMotionInfo.locusType.
+{
+    CDB_LOCUS_TYPE_UNSPECIFIED = 0; /* zero value, i.e. the proto3 default */
+    CDB_LOCUS_TYPE_ENTRY = 1;       /* a single backend process on the entry db:
+                                    * usually the qDisp itself, but could be a
+                                    * qExec started by the entry postmaster.
+                                    */
+
+    CDB_LOCUS_TYPE_SINGLE_QE = 2;   /* a single backend process on any db: the
+                                    * qDisp itself, or a qExec started by a
+                                    * segment postmaster or the entry postmaster.
+                                    */
+
+    CDB_LOCUS_TYPE_GENERAL = 3;      /* compatible with any locus (data is
+                                     * self-contained in the query plan or
+                                     * generally available in any qExec or qDisp) */
+
+    CDB_LOCUS_TYPE_SEGMENT_GENERAL = 4; /* generally available in any qExec, but not
+                                         * available in qDisp */
+
+    CDB_LOCUS_TYPE_REPLICATED = 5;    /* replicated over all qExecs of an N-gang */
+    CDB_LOCUS_TYPE_HASHED = 6;        /* hash partitioned over all qExecs of N-gang */
+    CDB_LOCUS_TYPE_HASHED_OJ = 7;     /* result of hash partitioned outer join, NULLs can be anywhere */
+    CDB_LOCUS_TYPE_STREWN = 8;        /* partitioned on no known function */
+    CDB_LOCUS_TYPE_END = 9;           /* sentinel: last valid CdbLocusType + 1 */
+}
+
+enum MotionType // How a motion routes tuples; used by MetricMotionInfo.type.
+{
+    MOTION_TYPE_UNSPECIFIED = 0;         // Zero value, i.e. the proto3 default
+    MOTION_TYPE_HASH = 1;                // Use hashing to select a segindex destination
+    MOTION_TYPE_FIXED = 2;               // Send tuples to a fixed set of segindexes
+    MOTION_TYPE_EXPLICIT = 3;            // Send tuples to the segment explicitly specified in their segid column
+}
+
+enum GpdbNodeType { // Node-type tag used by MetricPlan.type. NOTE(review): unlike the other enums in this file, values after the zero value carry no GPDB_NODE_TYPE_ prefix.
+	GPDB_NODE_TYPE_UNSPECIFIED = 0;
+	INDEX_INFO = 1;
+	EXPR_CONTEXT = 2;
+	PROJECTION_INFO = 3;
+	JUNK_FILTER = 4;
+	RESULT_REL_INFO = 5;
+	E_STATE = 6;
+	TUPLE_TABLE_SLOT = 7;
+	CDB_PROCESS = 8;
+	SLICE = 9;
+	SLICE_TABLE = 10;
+	CURSOR_POS_INFO = 11;
+	SHARE_NODE_ENTRY = 12;
+	PARTITION_STATE = 13;
+	QUERY_DISPATCH_DESC = 14;
+	OID_ASSIGNMENT = 15;
+	PLAN = 16;
+	SCAN = 17;
+	JOIN = 18;
+	RESULT = 19;
+	MODIFY_TABLE = 20;
+	APPEND = 21;
+	MERGE_APPEND = 22;
+	RECURSIVE_UNION = 23;
+	SEQUENCE = 24;
+	BITMAP_AND = 25;
+	BITMAP_OR = 26;
+	SEQ_SCAN = 27;
+	DYNAMIC_SEQ_SCAN = 28;
+	EXTERNAL_SCAN = 29;
+	INDEX_SCAN = 30;
+	DYNAMIC_INDEX_SCAN = 31;
+	INDEX_ONLY_SCAN = 32;
+	BITMAP_INDEX_SCAN = 33;
+	DYNAMIC_BITMAP_INDEX_SCAN = 34;
+	BITMAP_HEAP_SCAN = 35;
+	DYNAMIC_BITMAP_HEAP_SCAN = 36;
+	TID_SCAN = 37;
+	SUBQUERY_SCAN = 38;
+	FUNCTION_SCAN = 39;
+	TABLE_FUNCTION_SCAN = 40;
+	VALUES_SCAN = 41;
+	CTE_SCAN = 42;
+	WORK_TABLE_SCAN = 43;
+	FOREIGN_SCAN = 44;
+	NEST_LOOP = 45;
+	MERGE_JOIN = 46;
+	HASH_JOIN = 47;
+	MATERIAL = 48;
+	SORT = 49;
+	AGG = 50;
+	WINDOW_AGG = 51;
+	UNIQUE = 52;
+	HASH = 53;
+	SET_OP = 54;
+	LOCK_ROWS = 55;
+	LIMIT = 56;
+	MOTION = 57;
+	SHARE_INPUT_SCAN = 58;
+	REPEAT = 59;
+	DML = 60;
+	SPLIT_UPDATE = 61;
+	ROW_TRIGGER = 62;
+	ASSERT_OP = 63;
+	PARTITION_SELECTOR = 64;
+	PLAN_END = 65;
+	NEST_LOOP_PARAM = 66;
+	PLAN_ROW_MARK = 67;
+	PLAN_INVAL_ITEM = 68;
+	PLAN_STATE = 69;
+	SCAN_STATE = 70;
+	JOIN_STATE = 71;
+	RESULT_STATE = 72;
+	MODIFY_TABLE_STATE = 73;
+	APPEND_STATE = 74;
+	MERGE_APPEND_STATE = 75;
+	RECURSIVE_UNION_STATE = 76;
+	SEQUENCE_STATE = 77;
+	BITMAP_AND_STATE = 78;
+	BITMAP_OR_STATE = 79;
+	SEQ_SCAN_STATE = 80;
+	DYNAMIC_SEQ_SCAN_STATE = 81;
+	EXTERNAL_SCAN_STATE = 82;
+	INDEX_SCAN_STATE = 83;
+	DYNAMIC_INDEX_SCAN_STATE = 84;
+	INDEX_ONLY_SCAN_STATE = 85;
+	BITMAP_INDEX_SCAN_STATE = 86;
+	DYNAMIC_BITMAP_INDEX_SCAN_STATE = 87;
+	BITMAP_HEAP_SCAN_STATE = 88;
+	DYNAMIC_BITMAP_HEAP_SCAN_STATE = 89;
+	TID_SCAN_STATE = 90;
+	SUBQUERY_SCAN_STATE = 91;
+	FUNCTION_SCAN_STATE = 92;
+	TABLE_FUNCTION_STATE = 93;
+	VALUES_SCAN_STATE = 94;
+	CTE_SCAN_STATE = 95;
+	WORK_TABLE_SCAN_STATE = 96;
+	FOREIGN_SCAN_STATE = 97;
+	NEST_LOOP_STATE = 98;
+	MERGE_JOIN_STATE = 99;
+	HASH_JOIN_STATE = 100;
+	MATERIAL_STATE = 101;
+	SORT_STATE = 102;
+	AGG_STATE = 103;
+	WINDOW_AGG_STATE = 104;
+	UNIQUE_STATE = 105;
+	HASH_STATE = 106;
+	SET_OP_STATE = 107;
+	LOCK_ROWS_STATE = 108;
+	LIMIT_STATE = 109;
+	MOTION_STATE = 110;
+	SHARE_INPUT_SCAN_STATE = 111;
+	REPEAT_STATE = 112;
+	DML_STATE = 113;
+	SPLIT_UPDATE_STATE = 114;
+	ROW_TRIGGER_STATE = 115;
+	ASSERT_OP_STATE = 116;
+	PARTITION_SELECTOR_STATE = 117;
+	TUPLE_DESC_NODE = 118;
+	SERIALIZED_PARAM_EXTERN_DATA = 119;
+	ALIAS = 120;
+	RANGE_VAR = 121;
+	EXPR = 122;
+	VAR = 123;
+	CONST = 124;
+	PARAM = 125;
+	AGGREF = 126;
+	WINDOW_FUNC = 127;
+	ARRAY_REF = 128;
+	FUNC_EXPR = 129;
+	NAMED_ARG_EXPR = 130;
+	OP_EXPR = 131;
+	DISTINCT_EXPR = 132;
+	NULL_IF_EXPR = 133;
+	SCALAR_ARRAY_OP_EXPR = 134;
+	BOOL_EXPR = 135;
+	SUB_LINK = 136;
+	SUB_PLAN = 137;
+	ALTERNATIVE_SUB_PLAN = 138;
+	FIELD_SELECT = 139;
+	FIELD_STORE = 140;
+	RELABEL_TYPE = 141;
+	COERCE_VIA_IO = 142;
+	ARRAY_COERCE_EXPR = 143;
+	CONVERT_ROWTYPE_EXPR = 144;
+	COLLATE_EXPR = 145;
+	CASE_EXPR = 146;
+	CASE_WHEN = 147;
+	CASE_TEST_EXPR = 148;
+	ARRAY_EXPR = 149;
+	ROW_EXPR = 150;
+	ROW_COMPARE_EXPR = 151;
+	COALESCE_EXPR = 152;
+	MIN_MAX_EXPR = 153;
+	XML_EXPR = 154;
+	NULL_TEST = 155;
+	BOOLEAN_TEST = 156;
+	COERCE_TO_DOMAIN = 157;
+	COERCE_TO_DOMAIN_VALUES = 158;
+	SET_TO_DEFAULT = 159;
+	CURRENT_OF_EXPR = 160;
+	TARGET_ENTRY = 161;
+	RANGE_TBL_REF = 162;
+	JOIN_EXPR = 163;
+	FROM_EXPR = 164;
+	INTO_CLAUSE = 165;
+	COPY_INTO_CLAUSE = 166;
+	REFRESH_CLAUSE = 167;
+	FLOW = 168;
+	GROUPING = 169;
+	GROUP_ID = 170;
+	DISTRIBUTED_BY = 171;
+	DML_ACTION_EXPR = 172;
+	PART_SELECTED_EXPR = 173;
+	PART_DEFAULT_EXPR = 174;
+	PART_BOUND_EXPR = 175;
+	PART_BOUND_INCLUSION_EXPR = 176;
+	PART_BOUND_OPEN_EXPR = 177;
+	PART_LIST_RULE_EXPR = 178;
+	PART_LIST_NULL_TEST_EXPR = 179;
+	TABLE_OID_INFO = 180;
+	EXPR_STATE = 181;
+	GENERIC_EXPR_STATE = 182;
+	WHOLE_ROW_VAR_EXPR_STATE = 183;
+	AGGREF_EXPR_STATE = 184;
+	WINDOW_FUNC_EXPR_STATE = 185;
+	ARRAY_REF_EXPR_STATE = 186;
+	FUNC_EXPR_STATE = 187;
+	SCALAR_ARRAY_OP_EXPR_STATE = 188;
+	BOOL_EXPR_STATE = 189;
+	SUB_PLAN_STATE = 190;
+	ALTERNATIVE_SUB_PLAN_STATE = 191;
+	FIELD_SELECT_STATE = 192;
+	FIELD_STORE_STATE = 193;
+	COERCE_VIA_IO_STATE = 194;
+	ARRAY_COERCE_EXPR_STATE = 195;
+	CONVERT_ROWTYPE_EXPR_STATE = 196;
+	CASE_EXPR_STATE = 197;
+	CASE_WHEN_STATE = 198;
+	ARRAY_EXPR_STATE = 199;
+	ROW_EXPR_STATE = 200;
+	ROW_COMPARE_EXPR_STATE = 201;
+	COALESCE_EXPR_STATE = 202;
+	MIN_MAX_EXPR_STATE = 203;
+	XML_EXPR_STATE = 204;
+	NULL_TEST_STATE = 205;
+	COERCE_TO_DOMAIN_STATE = 206;
+	DOMAIN_CONSTRAINT_STATE = 207;
+	GROUPING_FUNC_EXPR_STATE = 208;
+	PART_SELECTED_EXPR_STATE = 209;
+	PART_DEFAULT_EXPR_STATE = 210;
+	PART_BOUND_EXPR_STATE = 211;
+	PART_BOUND_INCLUSION_EXPR_STATE = 212;
+	PART_BOUND_OPEN_EXPR_STATE = 213;
+	PART_LIST_RULE_EXPR_STATE = 214;
+	PART_LIST_NULL_TEST_EXPR_STATE = 215;
+	PLANNER_INFO = 216;
+	PLANNER_GLOBAL = 217;
+	REL_OPT_INFO = 218;
+	INDEX_OPT_INFO = 219;
+	PARAM_PATH_INFO = 220;
+	PATH = 221;
+	APPEND_ONLY_PATH = 222;
+	AOCS_PATH = 223;
+	EXTERNAL_PATH = 224;
+	INDEX_PATH = 225;
+	BITMAP_HEAP_PATH = 226;
+	BITMAP_AND_PATH = 227;
+	BITMAP_OR_PATH = 228;
+	NEST_PATH = 229;
+	MERGE_PATH = 230;
+	HASH_PATH = 231;
+	TID_PATH = 232;
+	FOREIGN_PATH = 233;
+	APPEND_PATH = 234;
+	MERGE_APPEND_PATH = 235;
+	RESULT_PATH = 236;
+	MATERIAL_PATH = 237;
+	UNIQUE_PATH = 238;
+	PROJECTION_PATH = 239;
+	EQUIVALENCE_CLASS = 240;
+	EQUIVALENCE_MEMBER = 241;
+	PATH_KEY = 242;
+	RESTRICT_INFO = 243;
+	PLACE_HOLDER_VAR = 244;
+	SPECIAL_JOIN_INFO = 245;
+	LATERAL_JOIN_INFO = 246;
+	APPEND_REL_INFO = 247;
+	PLACE_HOLDER_INFO = 248;
+	MIN_MAX_AGG_INFO = 249;
+	PARTITION = 250;
+	PARTITION_RULE = 251;
+	PARTITION_NODE = 252;
+	PG_PART_RULE = 253;
+	SEGFILE_MAP_NODE = 254;
+	PLANNER_PARAM_ITEM = 255;
+	CDB_MOTION_PATH = 256;
+	PARTITION_SELECTOR_PATH = 257;
+	CDB_REL_COLUMN_INFO = 258;
+	DISTRIBUTION_KEY = 259;
+	MEMORY_CONTEXT = 260;
+	ALLOC_SET_CONTEXT = 261;
+	MEMORY_ACCOUNT = 262;
+	VALUE = 263;
+	INTEGER = 264;
+	FLOAT = 265;
+	STRING = 266;
+	BIT_STRING = 267;
+	NULL_VALUE = 268;
+	LIST = 269;
+	INT_LIST = 270;
+	OID_LIST = 271;
+	QUERY = 272;
+	PLANNED_STMT = 273;
+	INSERT_STMT = 274;
+	DELETE_STMT = 275;
+	UPDATE_STMT = 276;
+	SELECT_STMT = 277;
+	ALTER_TABLE_STMT = 278;
+	ALTER_TABLE_CMD = 279;
+	ALTER_DOMAIN_STMT = 280;
+	SET_OPERATION_STMT = 281;
+	GRANT_STMT = 282;
+	GRANT_ROLE_STMT = 283;
+	ALTER_DEFAULT_PRIVILEGES_STMT = 284;
+	CLOSE_PORTAL_STMT = 285;
+	CLUSTER_STMT = 286;
+	COPY_STMT = 287;
+	CREATE_STMT = 288;
+	SINGLE_ROW_ERROR_DESC = 289;
+	EXT_TABLE_TYPE_DESC = 290;
+	CREATE_EXTERNAL_STMT = 291;
+	DEFINE_STMT = 292;
+	DROP_STMT = 293;
+	TRUNCATE_STMT = 294;
+	COMMENT_STMT = 295;
+	FETCH_STMT = 296;
+	INDEX_STMT = 297;
+	CREATE_FUNCTION_STMT = 298;
+	ALTER_FUNCTION_STMT = 299;
+	DO_STMT = 300;
+	RENAME_STMT = 301;
+	RULE_STMT = 302;
+	NOTIFY_STMT = 303;
+	LISTEN_STMT = 304;
+	UNLISTEN_STMT = 305;
+	TRANSACTION_STMT = 306;
+	VIEW_STMT = 307;
+	LOAD_STMT = 308;
+	CREATE_DOMAIN_STMT = 309;
+	CREATEDB_STMT = 310;
+	DROPDB_STMT = 311;
+	VACUUM_STMT = 312;
+	EXPLAIN_STMT = 313;
+	CREATE_TABLE_AS_STMT = 314;
+	CREATE_SEQ_STMT = 315;
+	ALTER_SEQ_STMT = 316;
+	VARIABLE_SET_STMT = 317;
+	VARIABLE_SHOW_STMT = 318;
+	DISCARD_STMT = 319;
+	CREATE_TRIG_STMT = 320;
+	CREATE_P_LANG_STMT = 321;
+	CREATE_ROLE_STMT = 322;
+	ALTER_ROLE_STMT = 323;
+	DROP_ROLE_STMT = 324;
+	CREATE_QUEUE_STMT = 325;
+	ALTER_QUEUE_STMT = 326;
+	DROP_QUEUE_STMT = 327;
+	CREATE_RESOURCE_GROUP_STMT = 328;
+	DROP_RESOURCE_GROUP_STMT = 329;
+	ALTER_RESOURCE_GROUP_STMT = 330;
+	LOCK_STMT = 331;
+	CONSTRAINTS_SET_STMT = 332;
+	REINDEX_STMT = 333;
+	CHECK_POINT_STMT = 334;
+	CREATE_SCHEMA_STMT = 335;
+	ALTER_DATABASE_STMT = 336;
+	ALTER_DATABASE_SET_STMT = 337;
+	ALTER_ROLE_SET_STMT = 338;
+	CREATE_CONVERSION_STMT = 339;
+	CREATE_CAST_STMT = 340;
+	CREATE_OP_CLASS_STMT = 341;
+	CREATE_OP_FAMILY_STMT = 342;
+	ALTER_OP_FAMILY_STMT = 343;
+	PREPARE_STMT = 344;
+	EXECUTE_STMT = 345;
+	DEALLOCATE_STMT = 346;
+	DECLARE_CURSOR_STMT = 347;
+	CREATE_TABLE_SPACE_STMT = 348;
+	DROP_TABLE_SPACE_STMT = 349;
+	ALTER_OBJECT_SCHEMA_STMT = 350;
+	ALTER_OWNER_STMT = 351;
+	DROP_OWNED_STMT = 352;
+	REASSIGN_OWNED_STMT = 353;
+	COMPOSITE_TYPE_STMT = 354;
+	CREATE_ENUM_STMT = 355;
+	CREATE_RANGE_STMT = 356;
+	ALTER_ENUM_STMT = 357;
+	ALTER_TS_DICTIONARY_STMT = 358;
+	ALTER_TS_CONFIGURATION_STMT = 359;
+	CREATE_FDW_STMT = 360;
+	ALTER_FDW_STMT = 361;
+	CREATE_FOREIGN_SERVER_STMT = 362;
+	ALTER_FOREIGN_SERVER_STMT = 363;
+	CREATE_USER_MAPPING_STMT = 364;
+	ALTER_USER_MAPPING_STMT = 365;
+	DROP_USER_MAPPING_STMT = 366;
+	ALTER_TABLE_SPACE_OPTIONS_STMT = 367;
+	ALTER_TABLE_MOVE_ALL_STMT = 368;
+	SEC_LABEL_STMT = 369;
+	CREATE_FOREIGN_TABLE_STMT = 370;
+	CREATE_EXTENSION_STMT = 371;
+	ALTER_EXTENSION_STMT = 372;
+	ALTER_EXTENSION_CONTENTS_STMT = 373;
+	CREATE_EVENT_TRIG_STMT = 374;
+	ALTER_EVENT_TRIG_STMT = 375;
+	REFRESH_MAT_VIEW_STMT = 376;
+	REPLICA_IDENTITY_STMT = 377;
+	ALTER_SYSTEM_STMT = 378;
+	PARTITION_BY = 379;
+	PARTITION_ELEM = 380;
+	PARTITION_RANGE_ITEM = 381;
+	PARTITION_BOUND_SPEC = 382;
+	PARTITION_SPEC = 383;
+	PARTITION_VALUES_SPEC = 384;
+	ALTER_PARTITION_ID = 385;
+	ALTER_PARTITION_CMD = 386;
+	INHERIT_PARTITION_CMD = 387;
+	CREATE_FILE_SPACE_STMT = 388;
+	FILE_SPACE_ENTRY = 389;
+	DROP_FILE_SPACE_STMT = 390;
+	TABLE_VALUE_EXPR = 391;
+	DENY_LOGIN_INTERVAL = 392;
+	DENY_LOGIN_POINT = 393;
+	ALTER_TYPE_STMT = 394;
+	SET_DISTRIBUTION_CMD = 395;
+	EXPAND_STMT_SPEC = 396;
+	A_EXPR = 397;
+	COLUMN_REF = 398;
+	PARAM_REF = 399;
+	A_CONST = 400;
+	FUNC_CALL = 401;
+	A_STAR = 402;
+	A_INDICES = 403;
+	A_INDIRECTION = 404;
+	A_ARRAY_EXPR = 405;
+	RES_TARGET = 406;
+	TYPE_CAST = 407;
+	COLLATE_CLAUSE = 408;
+	SORT_BY = 409;
+	WINDOW_DEF = 410;
+	RANGE_SUBSELECT = 411;
+	RANGE_FUNCTION = 412;
+	TYPE_NAME = 413;
+	COLUMN_DEF = 414;
+	INDEX_ELEM = 415;
+	CONSTRAINT = 416;
+	DEF_ELEM = 417;
+	RANGE_TBL_ENTRY = 418;
+	RANGE_TBL_FUNCTION = 419;
+	WITH_CHECK_OPTION = 420;
+	GROUPING_CLAUSE = 421;
+	GROUPING_FUNC = 422;
+	SORT_GROUP_CLAUSE = 423;
+	WINDOW_CLAUSE = 424;
+	PRIV_GRANTEE = 425;
+	FUNC_WITH_ARGS = 426;
+	ACCESS_PRIV = 427;
+	CREATE_OP_CLASS_ITEM = 428;
+	TABLE_LIKE_CLAUSE = 429;
+	FUNCTION_PARAMETER = 430;
+	LOCKING_CLAUSE = 431;
+	ROW_MARK_CLAUSE = 432;
+	XML_SERIALIZE = 433;
+	WITH_CLAUSE = 434;
+	COMMON_TABLE_EXPR = 435;
+	COLUMN_REFERENCE_STORAGE_DIRECTIVE = 436;
+	IDENTIFY_SYSTEM_CMD = 437;
+	BASE_BACKUP_CMD = 438;
+	CREATE_REPLICATION_SLOT_CMD = 439;
+	DROP_REPLICATION_SLOT_CMD = 440;
+	START_REPLICATION_CMD = 441;
+	TIME_LINE_HISTORY_CMD = 442;
+	TRIGGER_DATA = 443;
+	EVENT_TRIGGER_DATA = 444;
+	RETURN_SET_INFO = 445;
+	WINDOW_OBJECT_DATA = 446;
+	TID_BITMAP = 447;
+	INLINE_CODE_BLOCK = 448;
+	FDW_ROUTINE = 449;
+	STREAM_BITMAP = 450;
+	FORMATTER_DATA = 451;
+	EXT_PROTOCOL_DATA = 452;
+	EXT_PROTOCOL_VALIDATOR_DATA = 453;
+	SELECTED_PARTS = 454;
+	COOKED_CONSTRAINT = 455;
+	CDB_EXPLAIN_STAT_HDR = 456;
+	GP_POLICY = 457;
+	RETRIEVE_STMT = 458;
+}
diff --git a/gpcontrib/gp_stats_collector/protos/gpsc_set_service.proto b/gpcontrib/gp_stats_collector/protos/gpsc_set_service.proto
new file mode 100644
index 00000000000..bcf09074ed7
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/protos/gpsc_set_service.proto
@@ -0,0 +1,69 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+syntax = "proto3";
+
+import "google/protobuf/timestamp.proto";
+
+import "protos/gpsc_metrics.proto";
+import "protos/gpsc_plan.proto";
+
+package gpsc;
+
+service SetQueryInfo {
+    rpc SetMetricPlanNode (SetPlanNodeReq) returns (MetricResponse) {}  // unary; carries one plan node
+
+    rpc SetMetricQuery (SetQueryReq) returns (MetricResponse) {}  // unary; carries one query report
+}
+
+message MetricResponse {
+    MetricResponseStatusCode error_code = 1;  // reply status for both SetQueryInfo RPCs
+    string error_text = 2;  // NOTE(review): presumably filled only on ERROR - confirm
+}
+
+enum MetricResponseStatusCode {
+    METRIC_RESPONSE_STATUS_CODE_UNSPECIFIED = 0;  // proto3 default when the field is unset
+    METRIC_RESPONSE_STATUS_CODE_SUCCESS = 1;
+    METRIC_RESPONSE_STATUS_CODE_ERROR = 2;
+}
+
+message SetQueryReq {
+    QueryStatus               query_status  = 1;
+    google.protobuf.Timestamp datetime      = 2;
+    QueryKey                  query_key     = 3;
+    SegmentKey                segment_key   = 4;
+    QueryInfo                 query_info    = 5;
+    GPMetrics                 query_metrics = 6;
+    repeated MetricPlan       plan_tree     = 7;
+    google.protobuf.Timestamp submit_time   = 8;
+    google.protobuf.Timestamp start_time    = 9;
+    google.protobuf.Timestamp end_time      = 10;
+    AdditionalQueryInfo       add_info      = 11;
+}
+
+message SetPlanNodeReq {
+    PlanNodeStatus            node_status  = 1;
+    google.protobuf.Timestamp datetime     = 2;
+    QueryKey                  query_key    = 3;
+    SegmentKey                segment_key  = 4;
+    GPMetrics                 node_metrics = 5;
+    MetricPlan                plan_node    = 6;
+    google.protobuf.Timestamp submit_time  = 7;
+    google.protobuf.Timestamp start_time   = 8;
+    google.protobuf.Timestamp end_time     = 9;
+}
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_cursors.sql b/gpcontrib/gp_stats_collector/sql/gpsc_cursors.sql
new file mode 100644
index 00000000000..8361f7b678d
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_cursors.sql
@@ -0,0 +1,85 @@
+CREATE EXTENSION gp_stats_collector;
+
+CREATE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+
+-- DECLARE
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+DECLARE cursor_stats_0 CURSOR FOR SELECT 0;
+CLOSE cursor_stats_0;
+COMMIT;
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- DECLARE WITH HOLD
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+DECLARE cursor_stats_1 CURSOR WITH HOLD FOR SELECT 1;
+CLOSE cursor_stats_1;
+DECLARE cursor_stats_2 CURSOR WITH HOLD FOR SELECT 2;
+CLOSE cursor_stats_2;
+COMMIT;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- ROLLBACK
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+DECLARE cursor_stats_3 CURSOR FOR SELECT 1;
+CLOSE cursor_stats_3;
+DECLARE cursor_stats_4 CURSOR FOR SELECT 1;
+ROLLBACK;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- FETCH
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+DECLARE cursor_stats_5 CURSOR WITH HOLD FOR SELECT 2;
+DECLARE cursor_stats_6 CURSOR WITH HOLD FOR SELECT 3;
+FETCH 1 IN cursor_stats_5;
+FETCH 1 IN cursor_stats_6;
+CLOSE cursor_stats_5;
+CLOSE cursor_stats_6;
+COMMIT;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_dist.sql b/gpcontrib/gp_stats_collector/sql/gpsc_dist.sql
new file mode 100644
index 00000000000..46b531a70ca
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_dist.sql
@@ -0,0 +1,88 @@
+CREATE EXTENSION gp_stats_collector;
+
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+SET gpsc.enable_utility TO FALSE;
+
+-- Hash distributed table
+
+CREATE TABLE test_hash_dist (id int) DISTRIBUTED BY (id);
+INSERT INTO test_hash_dist SELECT 1;
+
+SET gpsc.logging_mode to 'TBL';
+SET optimizer_enable_direct_dispatch TO TRUE;
+-- Direct dispatch is used here, only one segment is scanned.
+select * from test_hash_dist where id = 1;
+RESET optimizer_enable_direct_dispatch;
+
+RESET gpsc.logging_mode;
+-- Should see 8 rows.
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+SET gpsc.logging_mode to 'TBL';
+
+-- Scan all segments.
+select * from test_hash_dist;
+
+DROP TABLE test_hash_dist;
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Replicated table
+CREATE FUNCTION force_segments() RETURNS SETOF text AS $$
+BEGIN
+  RETURN NEXT 'seg';
+END;
+$$ LANGUAGE plpgsql VOLATILE EXECUTE ON ALL SEGMENTS;
+
+CREATE TABLE test_replicated (id int) DISTRIBUTED REPLICATED;
+INSERT INTO test_replicated SELECT 1;
+
+SET gpsc.logging_mode to 'TBL';
+SELECT COUNT(*) FROM test_replicated, force_segments();
+DROP TABLE test_replicated;
+DROP FUNCTION force_segments();
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Partially distributed table (2 numsegments)
+SET allow_system_table_mods = ON;
+CREATE TABLE test_partial_dist (id int, data text) DISTRIBUTED BY (id);
+UPDATE gp_distribution_policy SET numsegments = 2 WHERE localoid = 'test_partial_dist'::regclass;
+INSERT INTO test_partial_dist SELECT * FROM generate_series(1, 100);
+
+SET gpsc.logging_mode to 'TBL';
+SELECT COUNT(*) FROM test_partial_dist;
+RESET gpsc.logging_mode;
+
+DROP TABLE test_partial_dist;
+RESET allow_system_table_mods;
+-- Should see 12 rows.
+SELECT query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_guc_cache.sql b/gpcontrib/gp_stats_collector/sql/gpsc_guc_cache.sql
new file mode 100644
index 00000000000..6aff2ad5cf6
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_guc_cache.sql
@@ -0,0 +1,43 @@
+--
+-- Test GUC caching for query lifecycle consistency.
+--
+-- The extension logs SUBMIT and DONE events for each query.
+-- GUC values that control logging (enable_utility, ignored_users_list, ...)
+-- must be cached at SUBMIT time to ensure DONE uses the same filtering
+-- criteria. Otherwise, a SET command that modifies these GUCs would
+-- have its DONE event rejected, creating orphaned SUBMIT entries.
+-- This is due to query being actually executed between SUBMIT and DONE.
+-- start_ignore
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+SELECT gpsc.truncate_log();
+-- end_ignore
+
+CREATE OR REPLACE FUNCTION print_last_query(query text)
+RETURNS TABLE(query_status text) AS $$
+    SELECT query_status
+    FROM gpsc.log
+    WHERE segid = -1 AND query_text = query
+    ORDER BY ccnt DESC
+$$ LANGUAGE sql;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.logging_mode TO 'TBL';
+
+-- SET below disables utility logging and DONE must still be logged.
+SET gpsc.enable_utility TO FALSE;
+SELECT * FROM print_last_query('SET gpsc.enable_utility TO FALSE;');
+
+-- SELECT below adds current user to ignore list and DONE must still be logged.
+-- start_ignore
+SELECT set_config('gpsc.ignored_users_list', current_user, false);
+-- end_ignore
+SELECT * FROM print_last_query('SELECT set_config(''gpsc.ignored_users_list'', current_user, false);');
+
+DROP FUNCTION print_last_query(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
+RESET gpsc.logging_mode;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_locale.sql b/gpcontrib/gp_stats_collector/sql/gpsc_locale.sql
new file mode 100644
index 00000000000..6321c93f5ab
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_locale.sql
@@ -0,0 +1,29 @@
+-- The extension generates normalized query text and plan using jumbling functions.
+-- Those functions may fail when translating to wide character if the current locale
+-- cannot handle the character set. This test checks that even when those functions
+-- fail, the plan is still generated and executed. This test is partially taken from
+-- gp_locale.
+
+-- start_ignore
+DROP DATABASE IF EXISTS gpsc_test_locale;
+-- end_ignore
+
+CREATE DATABASE gpsc_test_locale WITH LC_COLLATE='C' LC_CTYPE='C' TEMPLATE=template0;
+\c gpsc_test_locale
+
+CREATE EXTENSION gp_stats_collector;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.enable TO TRUE;
+
+CREATE TABLE gpsc_hi_안녕세계 (a int, 안녕세계1 text, 안녕세계2 text, 안녕세계3 text) DISTRIBUTED BY (a);
+INSERT INTO gpsc_hi_안녕세계 VALUES(1, '안녕세계1 first', '안녕세2 first', '안녕세계3 first');
+-- Should not see error here
+UPDATE gpsc_hi_안녕세계 SET 안녕세계1='안녕세계1 first UPDATE' WHERE 안녕세계1='안녕세계1 first';
+
+RESET gpsc.enable;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
+DROP TABLE gpsc_hi_안녕세계;
+DROP EXTENSION gp_stats_collector;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_select.sql b/gpcontrib/gp_stats_collector/sql/gpsc_select.sql
new file mode 100644
index 00000000000..673cbee0c10
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_select.sql
@@ -0,0 +1,69 @@
+CREATE EXTENSION gp_stats_collector;
+
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+SET gpsc.enable_utility TO FALSE;
+
+-- Basic SELECT tests
+SET gpsc.logging_mode to 'TBL';
+
+SELECT 1;
+SELECT COUNT(*) FROM generate_series(1,10);
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Transaction test
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+SELECT 1;
+COMMIT;
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- CTE test
+SET gpsc.logging_mode to 'TBL';
+
+WITH t AS (VALUES (1), (2))
+SELECT * FROM t;
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Prepared statement test
+SET gpsc.logging_mode to 'TBL';
+
+PREPARE test_stmt AS SELECT 1;
+EXECUTE test_stmt;
+DEALLOCATE test_stmt;
+
+RESET gpsc.logging_mode;
+SELECT segid, query_text, query_status FROM gpsc.log ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_uds.sql b/gpcontrib/gp_stats_collector/sql/gpsc_uds.sql
new file mode 100644
index 00000000000..14377b15c8c
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_uds.sql
@@ -0,0 +1,31 @@
+-- Test UDS socket
+-- start_ignore
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+-- end_ignore
+
+\set UDS_PATH '/tmp/gpsc_test.sock'
+
+-- Configure extension to send via UDS
+SET gpsc.uds_path TO :'UDS_PATH';
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.logging_mode TO 'UDS';
+
+-- Start receiver
+SELECT gpsc.__test_uds_start_server(:'UDS_PATH');
+
+-- Send
+SELECT 1;
+
+-- Receive
+SELECT gpsc.__test_uds_receive() > 0 as received;
+
+-- Stop receiver
+SELECT gpsc.__test_uds_stop_server();
+
+-- Cleanup
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.uds_path;
+RESET gpsc.ignored_users_list;
+RESET gpsc.enable;
+RESET gpsc.logging_mode;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_utf8_trim.sql b/gpcontrib/gp_stats_collector/sql/gpsc_utf8_trim.sql
new file mode 100644
index 00000000000..a3f8a376d55
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_utf8_trim.sql
@@ -0,0 +1,45 @@
+CREATE EXTENSION IF NOT EXISTS gp_stats_collector;
+
+CREATE OR REPLACE FUNCTION get_marked_query(marker TEXT)
+RETURNS TEXT AS $$
+    SELECT query_text
+    FROM gpsc.log
+    WHERE query_text LIKE '%' || marker || '%'
+    ORDER BY datetime DESC
+    LIMIT 1
+$$ LANGUAGE sql VOLATILE;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+
+-- Test 1: 1 byte chars
+SET gpsc.max_text_size to 19;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test1*/ 'HelloWorld';
+RESET gpsc.logging_mode;
+SELECT octet_length(get_marked_query('test1')) = 19 AS correct_length;
+
+-- Test 2: 2 byte chars
+SET gpsc.max_text_size to 19;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test2*/ 'РУССКИЙЯЗЫК';
+RESET gpsc.logging_mode;
+-- Character 'Р' has two bytes and cut in the middle => not included.
+SELECT octet_length(get_marked_query('test2')) = 18 AS correct_length;
+
+-- Test 3: 4 byte chars
+SET gpsc.max_text_size to 21;
+SET gpsc.logging_mode to 'TBL';
+SELECT /*test3*/ '😀';
+RESET gpsc.logging_mode;
+-- Emoji has 4 bytes and cut before the last byte => not included.
+SELECT octet_length(get_marked_query('test3')) = 18 AS correct_length;
+
+-- Cleanup
+DROP FUNCTION get_marked_query(TEXT);
+RESET gpsc.max_text_size;
+RESET gpsc.logging_mode;
+RESET gpsc.enable;
+RESET gpsc.ignored_users_list;
+
+DROP EXTENSION gp_stats_collector;
diff --git a/gpcontrib/gp_stats_collector/sql/gpsc_utility.sql b/gpcontrib/gp_stats_collector/sql/gpsc_utility.sql
new file mode 100644
index 00000000000..9abb965db37
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/sql/gpsc_utility.sql
@@ -0,0 +1,135 @@
+CREATE EXTENSION gp_stats_collector;
+
+CREATE OR REPLACE FUNCTION gpsc_status_order(status text)
+RETURNS integer
+AS $$
+BEGIN
+    RETURN CASE status
+        WHEN 'QUERY_STATUS_SUBMIT' THEN 1
+        WHEN 'QUERY_STATUS_START' THEN 2
+        WHEN 'QUERY_STATUS_END' THEN 3
+        WHEN 'QUERY_STATUS_DONE' THEN 4
+        ELSE 999
+    END;
+END;
+$$ LANGUAGE plpgsql IMMUTABLE;
+
+SET gpsc.ignored_users_list TO '';
+SET gpsc.enable TO TRUE;
+SET gpsc.enable_utility TO TRUE;
+SET gpsc.report_nested_queries TO TRUE;
+
+SET gpsc.logging_mode to 'TBL';
+
+CREATE TABLE test_table (a int, b text);
+CREATE INDEX test_idx ON test_table(a);
+ALTER TABLE test_table ADD COLUMN c int DEFAULT 1;
+DROP TABLE test_table;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Partitioning
+SET gpsc.logging_mode to 'TBL';
+
+CREATE TABLE pt_test (a int, b int)
+DISTRIBUTED BY (a)
+PARTITION BY RANGE (a)
+(START (0) END (100) EVERY (50));
+DROP TABLE pt_test;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Views and Functions
+SET gpsc.logging_mode to 'TBL';
+
+CREATE VIEW test_view AS SELECT 1 AS a;
+CREATE FUNCTION test_func(i int) RETURNS int AS $$ SELECT $1 + 1; $$ LANGUAGE SQL;
+DROP VIEW test_view;
+DROP FUNCTION test_func(int);
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Transaction Operations
+SET gpsc.logging_mode to 'TBL';
+
+BEGIN;
+SAVEPOINT sp1;
+ROLLBACK TO sp1;
+COMMIT;
+
+BEGIN;
+SAVEPOINT sp2;
+ABORT;
+
+BEGIN;
+ROLLBACK;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- DML Operations
+SET gpsc.logging_mode to 'TBL';
+
+CREATE TABLE dml_test (a int, b text);
+INSERT INTO dml_test VALUES (1, 'test');
+UPDATE dml_test SET b = 'updated' WHERE a = 1;
+DELETE FROM dml_test WHERE a = 1;
+DROP TABLE dml_test;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- COPY Operations
+SET gpsc.logging_mode to 'TBL';
+
+CREATE TABLE copy_test (a int);
+COPY (SELECT 1) TO STDOUT;
+DROP TABLE copy_test;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- Prepared Statements and error during execute
+SET gpsc.logging_mode to 'TBL';
+
+PREPARE test_prep(int) AS SELECT $1/0 AS value;
+EXECUTE test_prep(0::int);
+DEALLOCATE test_prep;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+-- GUC Settings
+SET gpsc.logging_mode to 'TBL';
+
+SET gpsc.report_nested_queries TO FALSE;
+RESET gpsc.report_nested_queries;
+
+RESET gpsc.logging_mode;
+
+SELECT segid, query_text, query_status FROM gpsc.log WHERE segid = -1 AND utility = true ORDER BY segid, ccnt, gpsc_status_order(query_status) ASC;
+SELECT gpsc.truncate_log() IS NOT NULL AS t;
+
+DROP FUNCTION gpsc_status_order(text);
+DROP EXTENSION gp_stats_collector;
+RESET gpsc.enable;
+RESET gpsc.report_nested_queries;
+RESET gpsc.enable_utility;
+RESET gpsc.ignored_users_list;
diff --git a/gpcontrib/gp_stats_collector/src/Config.cpp b/gpcontrib/gp_stats_collector/src/Config.cpp
new file mode 100644
index 00000000000..08a8d8cff86
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/Config.cpp
@@ -0,0 +1,191 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * Config.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/Config.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "Config.h"
+#include <limits.h>
+#include <memory>
+#include <string>
+#include <unordered_set>
+#include "memory/gpdbwrappers.h"
+
+extern "C" {
+#include "postgres.h"
+#include "utils/guc.h"
+}
+
+static char *guc_uds_path = nullptr;
+static bool guc_enable_analyze = true;
+static bool guc_enable_cdbstats = true;
+static bool guc_enable_collector = false;
+static bool guc_report_nested_queries = true;
+static char *guc_ignored_users = nullptr;
+static int guc_max_text_size = 1 << 20;	  // in bytes (1MB)
+static int guc_max_plan_size = 1024;	  // in KB
+static int guc_min_analyze_time = 10000;  // in ms
+static int guc_logging_mode = LOG_MODE_UDS;
+static bool guc_enable_utility = false;
+
+static const struct config_enum_entry logging_mode_options[] = {
+	{"uds", LOG_MODE_UDS, false /* hidden */},
+	{"tbl", LOG_MODE_TBL, false},
+	{NULL, 0, false}};
+
+static bool ignored_users_guc_dirty = false;
+
+static void
+assign_ignored_users_hook(const char *, void *)
+{
+	ignored_users_guc_dirty = true;	 // Config::sync() re-parses the list
+}
+
+void
+Config::init_gucs()
+{
+	// Every gpsc.* GUC shares these flags; unit/visibility flags are OR-ed in.
+	const int flags = GUC_NOT_IN_SAMPLE | GUC_GPDB_NEED_SYNC;
+
+	DefineCustomStringVariable(
+		"gpsc.uds_path", "Sets filesystem path of the agent socket", nullptr,
+		&guc_uds_path, "/tmp/gpsc_agent.sock", PGC_SUSET, flags, nullptr,
+		nullptr, nullptr);
+
+	DefineCustomBoolVariable("gpsc.enable", "Enable metrics collector",
+							 nullptr, &guc_enable_collector, false, PGC_SUSET,
+							 flags, nullptr, nullptr, nullptr);
+
+	DefineCustomBoolVariable(
+		"gpsc.enable_analyze", "Collect analyze metrics in gpsc", nullptr,
+		&guc_enable_analyze, true, PGC_SUSET, flags, nullptr, nullptr, nullptr);
+
+	DefineCustomBoolVariable(
+		"gpsc.enable_cdbstats", "Collect CDB metrics in gpsc", nullptr,
+		&guc_enable_cdbstats, true, PGC_SUSET, flags, nullptr, nullptr,
+		nullptr);
+
+	DefineCustomBoolVariable(
+		"gpsc.report_nested_queries", "Collect stats on nested queries",
+		nullptr, &guc_report_nested_queries, true, PGC_USERSET, flags, nullptr,
+		nullptr, nullptr);
+
+	DefineCustomStringVariable(
+		"gpsc.ignored_users_list",
+		"Make gpsc ignore queries issued by given users", nullptr,
+		&guc_ignored_users, "", PGC_SUSET, flags, nullptr,
+		assign_ignored_users_hook, nullptr);
+
+	DefineCustomIntVariable(
+		"gpsc.max_text_size",
+		"Make gpsc trim query texts longer than configured size in bytes",
+		nullptr, &guc_max_text_size, 1 << 20 /* 1MB */, 0, INT_MAX, PGC_SUSET,
+		flags, nullptr, nullptr, nullptr);
+
+	DefineCustomIntVariable(
+		"gpsc.max_plan_size", "Make gpsc trim plan longer than configured size",
+		nullptr, &guc_max_plan_size, 1024, 0, INT_MAX / 1024, PGC_SUSET,
+		flags | GUC_UNIT_KB, nullptr, nullptr, nullptr);
+
+	DefineCustomIntVariable(
+		"gpsc.min_analyze_time",
+		"Sets the minimum execution time above which plans will be logged.",
+		"Zero prints all plans. -1 turns this feature off.",
+		&guc_min_analyze_time, 10000, -1, INT_MAX, PGC_USERSET,
+		flags | GUC_UNIT_MS, nullptr, nullptr, nullptr);
+
+	DefineCustomEnumVariable(
+		"gpsc.logging_mode", "Logging mode: UDS or PG Table", nullptr,
+		&guc_logging_mode, LOG_MODE_UDS, logging_mode_options, PGC_SUSET,
+		flags | GUC_SUPERUSER_ONLY, nullptr, nullptr, nullptr);
+
+	DefineCustomBoolVariable(
+		"gpsc.enable_utility", "Collect utility statement stats", nullptr,
+		&guc_enable_utility, false, PGC_USERSET, flags, nullptr, nullptr,
+		nullptr);
+}
+
+void
+Config::update_ignored_users(const char *new_guc_ignored_users)
+{
+	// Parse into a side set; ignored_users_ is swapped only after a clean parse.
+	auto fresh_set = std::make_unique<IgnoredUsers>();
+	if (new_guc_ignored_users != nullptr && *new_guc_ignored_users != '\0')
+	{
+		/* The splitter is handed a private, modifiable copy of the value */
+		char *raw_copy = gpdb::pstrdup(new_guc_ignored_users);
+		List *names;
+		ListCell *cell;
+
+		if (!gpdb::split_identifier_string(raw_copy, ',', &names))
+		{
+			/* Bad list syntax: release, report at LOG, keep the previous set */
+			gpdb::pfree(raw_copy);
+			gpdb::list_free(names);
+			ereport(LOG,
+					(errcode(ERRCODE_SYNTAX_ERROR),
+					 errmsg(
+						 "invalid list syntax in parameter gpsc.ignored_users_list")));
+			return;
+		}
+		foreach (cell, names)
+		{
+			fresh_set->insert((char *) lfirst(cell));
+		}
+		/* Each name was copied into a std::string, so free the originals */
+		gpdb::pfree(raw_copy);
+		gpdb::list_free(names);
+	}
+	ignored_users_ = std::move(fresh_set);
+}
+
+bool
+Config::filter_user(const std::string &username) const
+{
+	// No set built yet (ignored_users_ is null): every user is filtered.
+	// Otherwise only the names stored in the set are filtered.
+	const bool no_set_yet = !ignored_users_;
+
+	return no_set_yet || ignored_users_->count(username) != 0;
+}
+
+void
+Config::sync()
+{
+	if (ignored_users_guc_dirty)  // raised by assign_ignored_users_hook()
+	{
+		update_ignored_users(guc_ignored_users);
+		ignored_users_guc_dirty = false;  // cleared even if the parse failed
+	}
+	uds_path_ = guc_uds_path;  // from here on: plain copies of the GUC variables
+	enable_analyze_ = guc_enable_analyze;
+	enable_cdbstats_ = guc_enable_cdbstats;
+	enable_collector_ = guc_enable_collector;
+	enable_utility_ = guc_enable_utility;
+	report_nested_queries_ = guc_report_nested_queries;
+	max_text_size_ = guc_max_text_size;
+	max_plan_size_ = guc_max_plan_size;	 // still in KB; see max_plan_size()
+	min_analyze_time_ = guc_min_analyze_time;
+	logging_mode_ = guc_logging_mode;
+}
diff --git a/gpcontrib/gp_stats_collector/src/Config.h b/gpcontrib/gp_stats_collector/src/Config.h
new file mode 100644
index 00000000000..259799e5135
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/Config.h
@@ -0,0 +1,115 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * Config.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/Config.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef CONFIG_H
+#define CONFIG_H
+
+#include <memory>
+#include <string>
+#include <unordered_set>
+
+#define LOG_MODE_UDS 0
+#define LOG_MODE_TBL 1
+
+using IgnoredUsers = std::unordered_set<std::string>;
+
+class Config
+{
+public:
+	static void init_gucs();  // defines every gpsc.* custom GUC
+	// Refreshes this snapshot from the current GUC variables.
+	void sync();
+	// Accessors return the values captured by the most recent sync().
+	const std::string &
+	uds_path() const
+	{
+		return uds_path_;
+	}
+	bool
+	enable_analyze() const
+	{
+		return enable_analyze_;
+	}
+	bool
+	enable_cdbstats() const
+	{
+		return enable_cdbstats_;
+	}
+	bool
+	enable_collector() const
+	{
+		return enable_collector_;
+	}
+	bool
+	enable_utility() const
+	{
+		return enable_utility_;
+	}
+	bool
+	report_nested_queries() const
+	{
+		return report_nested_queries_;
+	}
+	int
+	max_text_size() const
+	{
+		return max_text_size_;	// bytes
+	}
+	int
+	max_plan_size() const
+	{
+		return max_plan_size_ * 1024;  // stored in KB, returned in bytes
+	}
+	int
+	min_analyze_time() const
+	{
+		return min_analyze_time_;  // milliseconds; -1 disables
+	}
+	int
+	logging_mode() const
+	{
+		return logging_mode_;  // LOG_MODE_UDS or LOG_MODE_TBL
+	}
+	bool filter_user(const std::string &username) const;  // true: skip user
+
+private:
+	void update_ignored_users(const char *new_guc_ignored_users);
+	// Defaults mirror the GUC boot values, so reads before sync() are defined.
+	std::unique_ptr<IgnoredUsers> ignored_users_;
+	std::string uds_path_;
+	bool enable_analyze_ = true;
+	bool enable_cdbstats_ = true;
+	bool enable_collector_ = false;
+	bool enable_utility_ = false;
+	bool report_nested_queries_ = true;
+	int max_text_size_ = 1 << 20;
+	int max_plan_size_ = 1024;
+	int min_analyze_time_ = 10000;
+	int logging_mode_ = LOG_MODE_UDS;
+};
+
+#endif /* CONFIG_H */
diff --git a/gpcontrib/gp_stats_collector/src/EventSender.cpp b/gpcontrib/gp_stats_collector/src/EventSender.cpp
new file mode 100644
index 00000000000..0bc44c1198d
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/EventSender.cpp
@@ -0,0 +1,645 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * EventSender.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/EventSender.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "UDSConnector.h"
+#include "log/LogOps.h"
+#include "memory/gpdbwrappers.h"
+
+#define typeid __typeid
+extern "C" {
+#include "postgres.h"
+
+#include "executor/executor.h"
+#include "utils/elog.h"
+#include "utils/guc.h"
+
+#include "cdb/cdbexplain.h"
+#include "cdb/cdbvars.h"
+#include "cdb/ml_ipc.h"
+}
+#undef typeid
+
+#include "EventSender.h"
+#include "PgUtils.h"
+#include "ProtoUtils.h"
+
+#define need_collect_analyze()                                        \
+	(Gp_role == GP_ROLE_DISPATCH && config.min_analyze_time() >= 0 && \
+	 config.enable_analyze()) /* dispatcher only; negative threshold = off */
+
+// Gatekeeper shared by every hook: returns true when the event for this
+// query in the given state should be processed, false when it is skipped.
+// Side effects: SUBMIT re-syncs the config and may register a query key or
+// reset the nested counters; START submits a not-yet-submitted query.
+bool
+EventSender::verify_query(QueryDesc *query_desc, QueryState state, bool utility)
+{
+	const bool known_role =
+		Gp_role == GP_ROLE_DISPATCH || Gp_role == GP_ROLE_EXECUTE;
+	if (!proto_verified || !known_role)
+	{
+		return false;
+	}
+
+	switch (state)
+	{
+		case QueryState::SUBMIT:
+			// Sync the GUC cache exactly here so that every later state of
+			// this query is judged by the same settings. Otherwise a query
+			// that itself changes a filtering GUC would be filtered
+			// differently at DONE than at SUBMIT, and its DONE event would
+			// be wrongly dropped or wrongly emitted.
+			config.sync();
+
+			if (!config.enable_collector() ||
+				(utility && !config.enable_utility()))
+			{
+				return false;
+			}
+
+			// A nested query that will not be reported still gets a key, so
+			// that the END/DONE hooks can see its nesting level and skip it.
+			if (nesting_level > 0 && !need_report_nested_query())
+			{
+				QueryKey::register_qkey(query_desc, nesting_level);
+				return false;
+			}
+
+			// A new top-level query starts with fresh nested-query totals.
+			if (is_top_level_query(query_desc, nesting_level))
+			{
+				nested_calls = 0;
+				nested_timing = 0;
+			}
+			break;
+
+		case QueryState::START:
+			// Not submitted yet: submit it now, as a non-utility query.
+			if (!qdesc_submitted(query_desc))
+			{
+				collect_query_submit(query_desc, false /* utility */);
+			}
+			break;
+
+		case QueryState::DONE:
+			if (utility && !config.enable_utility())
+			{
+				return false;
+			}
+			break;
+
+		default:
+			// END has no state-specific check.
+			break;
+	}
+
+	// Checks common to every state.
+	return !filter_query(query_desc) &&
+		   nesting_is_valid(query_desc, nesting_level);
+}
+
+// Emits one query message through the configured sink. Returns true when the
+// caller should then clear the message's big fields (table sink: never).
+bool
+EventSender::log_query_req(const gpsc::SetQueryReq &req,
+						   const std::string &event, bool utility)
+{
+	const int mode = config.logging_mode();
+	if (mode == LOG_MODE_UDS)
+	{
+		return UDSConnector::report_query(req, event, config);
+	}
+	if (mode == LOG_MODE_TBL)
+	{
+		gpdb::insert_log(req, utility);
+		return false;
+	}
+	Assert(false);	/* unknown logging mode */
+	return false;
+}
+
+// Entry point for the metrics hook: routes each status to its handler.
+// `arg` is treated as a QueryDesc pointer. An unknown status raises ERROR.
+void
+EventSender::query_metrics_collect(QueryMetricsStatus status, void *arg,
+								   bool utility, ErrorData *edata)
+{
+	auto *qdesc = static_cast<QueryDesc *>(arg);
+	switch (status)
+	{
+		case METRICS_QUERY_SUBMIT:
+			collect_query_submit(qdesc, utility);
+			break;
+		case METRICS_QUERY_DONE:
+		case METRICS_QUERY_ERROR:
+		case METRICS_QUERY_CANCELED:
+		case METRICS_INNER_QUERY_DONE:
+			collect_query_done(qdesc, utility, status, edata);
+			break;
+		// Deliberately ignored statuses:
+		//  - plan node events: TODO, not handled yet;
+		//  - QUERY_START: executor_after_start is enough;
+		//  - QUERY_CANCELING: only the final CANCELED event is reported,
+		//    unless end users ask for the intermediate state.
+		case METRICS_PLAN_NODE_INITIALIZE:
+		case METRICS_PLAN_NODE_EXECUTING:
+		case METRICS_PLAN_NODE_FINISHED:
+		case METRICS_QUERY_START:
+		case METRICS_QUERY_CANCELING:
+			break;
+		default:
+			ereport(ERROR, (errmsg("Unknown query status: %d", status)));
+	}
+}
+
+// Runs before executor start. On the dispatcher, with analyze collection on
+// and EXPLAIN-only off, switches on buffer, row and timer instrumentation
+// for the query, plus CDB instrumentation when cdbstats is enabled.
+void
+EventSender::executor_before_start(QueryDesc *query_desc, int eflags)
+{
+	if (!verify_query(query_desc, QueryState::START, false /* utility*/))
+		return;
+
+	if (Gp_role != GP_ROLE_DISPATCH || !config.enable_analyze() ||
+		(eflags & EXEC_FLAG_EXPLAIN_ONLY) != 0)
+		return;
+
+	query_desc->instrument_options |=
+		INSTRUMENT_BUFFERS | INSTRUMENT_ROWS | INSTRUMENT_TIMER;
+	if (!config.enable_cdbstats())
+		return;
+	query_desc->instrument_options |= INSTRUMENT_CDB;
+	if (query_desc->showstatctx == NULL)
+	{
+		// No stats context yet: open one stamped with the current time.
+		instr_time now;
+		INSTR_TIME_SET_CURRENT(now);
+		query_desc->showstatctx =
+			gpdb::cdbexplain_showExecStatsBegin(query_desc, now);
+	}
+}
+
+// Runs after the executor has started: stamps start_time, moves the query to
+// START, attaches the plan, prepares run-time accounting when analyze
+// collection applies, and emits the "started" event.
+void
+EventSender::executor_after_start(QueryDesc *query_desc, int /* eflags*/)
+{
+	if (!verify_query(query_desc, QueryState::START, false /* utility */))
+		return;
+
+	auto &item = get_query(query_desc);
+	auto *msg = item.message.get();
+	*msg->mutable_start_time() = current_ts();
+	update_query_state(item, QueryState::START, false /* utility */);
+	set_query_plan(msg, query_desc, config);
+	// Allocate the total-run-time instrumentation in the per-query context so
+	// that it goes away together with the query at executor end.
+	if (need_collect_analyze() && query_desc->totaltime == NULL)
+	{
+		MemoryContext saved =
+			gpdb::mem_ctx_switch_to(query_desc->estate->es_query_cxt);
+		query_desc->totaltime = gpdb::instr_alloc(1, INSTRUMENT_ALL, false);
+		gpdb::mem_ctx_switch_to(saved);
+	}
+
+	// The "started" event goes out with empty metrics: park the current
+	// metrics in a local, send, then swap them back into the message.
+	gpsc::GPMetrics parked;
+	std::swap(parked, *msg->mutable_query_metrics());
+	if (log_query_req(*msg, "started", false /* utility */))
+	{
+		clear_big_fields(msg);
+	}
+	std::swap(parked, *msg->mutable_query_metrics());
+}
+
+// Runs at executor end: stamps end_time, moves the query to END, refreshes
+// its metrics and emits the "ended" event, clearing the message's big fields
+// afterwards when the sink asks for it.
+void
+EventSender::executor_end(QueryDesc *query_desc)
+{
+	if (!verify_query(query_desc, QueryState::END, false /* utility */))
+		return;
+
+	auto &item = get_query(query_desc);
+	auto *msg = item.message.get();
+	*msg->mutable_end_time() = current_ts();
+	update_query_state(item, QueryState::END, false /* utility */);
+
+	// Only a top-level query is charged with the nested-query totals
+	// accumulated so far; a nested query reports zeros for both.
+	const bool top_level = is_top_level_query(query_desc, nesting_level);
+	const int64_t calls = top_level ? nested_calls : 0;
+	const double timing = top_level ? nested_timing : 0;
+	set_gp_metrics(msg->mutable_query_metrics(), query_desc, calls, timing);
+
+	if (log_query_req(*msg, "ended", false /* utility */))
+	{
+		clear_big_fields(msg);
+	}
+}
+
+// Starts tracking a query: registers it, builds and emits the "submit"
+// message, then stores a baseline metrics snapshot in the message.
+void
+EventSender::collect_query_submit(QueryDesc *query_desc, bool utility)
+{
+	if (!verify_query(query_desc, QueryState::SUBMIT, utility))
+		return;
+
+	submit_query(query_desc);
+	auto *msg = get_query(query_desc).message.get();
+	*msg = create_query_req(gpsc::QueryStatus::QUERY_STATUS_SUBMIT);
+	*msg->mutable_submit_time() = current_ts();
+	set_query_info(msg);
+	set_qi_nesting_level(msg, nesting_level);
+	set_qi_slice_id(msg);
+	set_query_text(msg, query_desc, config);
+	if (log_query_req(*msg, "submit", utility))
+	{
+		clear_big_fields(msg);
+	}
+
+	// Baseline snapshot taken right away, so that the END/DONE events can
+	// later compute a diff against it safely.
+	set_gp_metrics(msg->mutable_query_metrics(), query_desc, 0, 0);
+#ifdef IC_TEARDOWN_HOOK
+	// Same baseline for the interconnect statistics.
+	ic_metrics_collect();
+	set_ic_stats(msg->mutable_query_metrics()->mutable_instrumentation(),
+				 &ic_statistics);
+#endif
+}
+
+void
+EventSender::report_query_done(QueryDesc *query_desc, QueryItem &query,
+							   QueryMetricsStatus status, bool utility,
+							   ErrorData *edata)
+{
+	gpsc::QueryStatus query_status;  // final status written into the message
+	std::string msg;  // event name handed to log_query_req()
+	switch (status)
+	{
+		case METRICS_QUERY_DONE:
+		case METRICS_INNER_QUERY_DONE:
+			query_status = gpsc::QueryStatus::QUERY_STATUS_DONE;
+			msg = "done";
+			break;
+		case METRICS_QUERY_ERROR:
+			query_status = gpsc::QueryStatus::QUERY_STATUS_ERROR;
+			msg = "error";
+			break;
+		case METRICS_QUERY_CANCELING:
+			// This event is not tracked at the moment (query_metrics_collect
+			// ignores it); the mapping is kept here just in case.
+			Assert(false);
+			query_status = gpsc::QueryStatus::QUERY_STATUS_CANCELLING;
+			msg = "cancelling";
+			break;
+		case METRICS_QUERY_CANCELED:
+			query_status = gpsc::QueryStatus::QUERY_STATUS_CANCELED;
+			msg = "cancelled";
+			break;
+		default:
+			ereport(ERROR,
+					(errmsg("Unexpected query status in query_done hook: %d",
+							status)));
+	}
+	auto prev_state = query.state;  // remembered before the transition below
+	update_query_state(query, QueryState::DONE, utility,
+					   query_status == gpsc::QueryStatus::QUERY_STATUS_DONE);
+	auto query_msg = query.message.get();
+	query_msg->set_query_status(query_status);  // overrides the DONE set above
+	if (status == METRICS_QUERY_ERROR)
+	{
+		bool error_flushed = elog_message() == NULL;  // no pending elog text
+		if (error_flushed && (edata == NULL || edata->message == NULL))
+		{
+			ereport(WARNING, (errmsg("GPSC missing error message")));
+			ereport(DEBUG3, (errmsg("GPSC query sourceText: %s",
+									query_desc->sourceText)));
+		}
+		else
+		{
+			set_qi_error_message(  // edata is non-NULL whenever it is read here
+				query_msg, error_flushed ? edata->message : elog_message(),
+				config);
+		}
+	}
+	if (prev_state == START)
+	{
+		// The ExecutorEnd call was missed because of a cancel or an error.
+		// That is fine, but the execution stats must be collected here.
+		*query_msg->mutable_end_time() = current_ts();
+		set_gp_metrics(query_msg->mutable_query_metrics(), query_desc,
+					   nested_calls, nested_timing);  // NOTE(review): executor_end passes 0, 0 for nested queries - confirm
+	}
+#ifdef IC_TEARDOWN_HOOK
+	ic_metrics_collect();
+	set_ic_stats(query_msg->mutable_query_metrics()->mutable_instrumentation(),
+				 &ic_statistics);
+#endif
+	(void) log_query_req(*query_msg, msg, utility);  // result ignored: caller erases the query next
+}
+
+void
+EventSender::collect_query_done(QueryDesc *query_desc, bool utility,
+								QueryMetricsStatus status, ErrorData *edata)
+{
+	if (!verify_query(query_desc, QueryState::DONE, utility))
+	{
+		return;
+	}
+
+	// Skip sending done message if query errored before submit.
+	if (!qdesc_submitted(query_desc))
+	{
+		if (status != METRICS_QUERY_ERROR)
+		{
+			ereport(WARNING, (errmsg("GPSC trying to process DONE hook for "
+									 "unsubmitted and unerrored query")));
+			ereport(DEBUG3, (errmsg("GPSC query sourceText: %s",
+									query_desc->sourceText)));
+		}
+		return;
+	}
+
+	if (queries.empty())
+	{
+		ereport(WARNING,
+				(errmsg("GPSC cannot find query to process DONE hook")));
+		ereport(DEBUG3,
+				(errmsg("GPSC query sourceText: %s", query_desc->sourceText)));
+		return;
+	}
+	auto &query = get_query(query_desc);
+
+	report_query_done(query_desc, query, status, utility, edata);
+
+	if (need_report_nested_query())
+		update_nested_counters(query_desc);
+
+	queries.erase(QueryKey::from_qdesc(query_desc));
+	pfree(query_desc->gpsc_query_key);
+	query_desc->gpsc_query_key = NULL;
+}
+
+// Adds the current UDPIFC interconnect counters to the running totals in
+// ic_statistics. Does nothing unless the interconnect type is UDPIFC and
+// collection is enabled for the current user (or without IC_TEARDOWN_HOOK).
+void
+EventSender::ic_metrics_collect()
+{
+#ifdef IC_TEARDOWN_HOOK
+	if (Gp_interconnect_type != INTERCONNECT_TYPE_UDPIFC || !proto_verified ||
+		gp_command_count == 0 || !config.enable_collector() ||
+		config.filter_user(get_user_name()))
+	{
+		return;
+	}
+	// The nesting level is not known inside this callback, so nested queries
+	// cannot be filtered here: the stats are gathered regardless and thrown
+	// away later if necessary.
+	const auto snap = UDPIFCGetICStats();
+	ic_statistics.totalRecvQueueSize += snap.totalRecvQueueSize;
+	ic_statistics.recvQueueSizeCountingTime +=
+		snap.recvQueueSizeCountingTime;
+	ic_statistics.totalCapacity += snap.totalCapacity;
+	ic_statistics.capacityCountingTime += snap.capacityCountingTime;
+	ic_statistics.totalBuffers += snap.totalBuffers;
+	ic_statistics.bufferCountingTime += snap.bufferCountingTime;
+	ic_statistics.activeConnectionsNum += snap.activeConnectionsNum;
+	ic_statistics.retransmits += snap.retransmits;
+	ic_statistics.startupCachedPktNum += snap.startupCachedPktNum;
+	ic_statistics.mismatchNum += snap.mismatchNum;
+	ic_statistics.crcErrors += snap.crcErrors;
+	ic_statistics.sndPktNum += snap.sndPktNum;
+	ic_statistics.recvPktNum += snap.recvPktNum;
+	ic_statistics.disorderedPktNum += snap.disorderedPktNum;
+	ic_statistics.duplicatedPktNum += snap.duplicatedPktNum;
+	ic_statistics.recvAckNum += snap.recvAckNum;
+	ic_statistics.statusQueryMsgNum += snap.statusQueryMsgNum;
+#endif
+}
+
+// Attaches the analyze plan text to the query's message, but only on the
+// dispatcher, only when run time was tracked, and only when the query ran
+// for at least min_analyze_time milliseconds.
+void
+EventSender::analyze_stats_collect(QueryDesc *query_desc)
+{
+	if (!verify_query(query_desc, QueryState::END, false /* utility */) ||
+		Gp_role != GP_ROLE_DISPATCH)
+	{
+		return;
+	}
+	if (query_desc->totaltime == NULL || !need_collect_analyze())
+	{
+		return;
+	}
+	// Make sure stats accumulation is done.
+	// (Note: it's okay if several levels of hook all do this.)
+	gpdb::instr_end_loop(query_desc->totaltime);
+
+	// total is multiplied by 1000 to be comparable with the ms threshold.
+	const double elapsed_ms = query_desc->totaltime->total * 1000.0;
+	if (elapsed_ms >= config.min_analyze_time())
+	{
+		auto *msg = get_query(query_desc).message.get();
+		set_analyze_plan_text(query_desc, msg, config);
+	}
+}
+
+EventSender::EventSender()
+{
+	// Perform the initial sync so the cached config holds the default GUC values.
+	config.sync();
+
+	try
+	{
+		GOOGLE_PROTOBUF_VERIFY_VERSION;
+		proto_verified = true;  // verify_query() rejects every event while false
+	}
+	catch (const std::exception &e)
+	{  // proto_verified keeps its default (false), so collection stays off
+		ereport(INFO, (errmsg("GPSC protobuf version mismatch is detected %s",
+							  e.what())));
+	}
+#ifdef IC_TEARDOWN_HOOK
+	memset(&ic_statistics, 0, sizeof(ICStatistics));  // totals start at zero
+#endif
+}
+
+EventSender::~EventSender()
+{
+	for (const auto &[qkey, _] : queries)  // entries never erased by collect_query_done()
+	{
+		ereport(LOG,
+				(errmsg("GPSC query with missing done event: "
+						"tmid=%d ssid=%d ccnt=%d nlvl=%d",
+						qkey.tmid, qkey.ssid, qkey.ccnt, qkey.nesting_level)));
+	}
+}
+
+// Very simplistic state machine: moves `query` to `new_state`, sets the matching
+// message status, and asserts on transitions that would point to a bug in GP.
+void
+EventSender::update_query_state(QueryItem &query, QueryState new_state,
+								bool utility, bool success)
+{
+	switch (new_state)
+	{
+		case QueryState::SUBMIT:
+			Assert(false);  // SUBMIT is only ever the initial state (see submit_query)
+			break;
+		case QueryState::START:
+			if (query.state == QueryState::SUBMIT)
+			{
+				query.message->set_query_status(
+					gpsc::QueryStatus::QUERY_STATUS_START);
+			}
+			else
+			{
+				Assert(false);  // START is expected straight after SUBMIT only
+			}
+			break;
+		case QueryState::END:
+			// No state assertion here on purpose. The check
+			//   Assert(query.state == QueryState::START || IsAbortInProgress());
+			// triggered, e.g. when a CURSOR closes before ever being executed.
+			query.message->set_query_status(
+				gpsc::QueryStatus::QUERY_STATUS_END);
+			break;
+		case QueryState::DONE:
+			Assert(query.state == QueryState::END || !success || utility);  // only a successful non-utility query must have passed END
+			query.message->set_query_status(
+				gpsc::QueryStatus::QUERY_STATUS_DONE);
+			break;
+		default:
+			Assert(false);
+	}
+	query.state = new_state;  // recorded even when an assertion above would have failed
+}
+
+EventSender::QueryItem &
+EventSender::get_query(QueryDesc *query_desc)
+{
+	if (!qdesc_submitted(query_desc))  // no key, or key not tracked in `queries`
+	{
+		ereport(
+			WARNING,
+			(errmsg("GPSC attempting to get query that was not submitted")));
+		ereport(DEBUG3,
+				(errmsg("GPSC query sourceText: %s", query_desc->sourceText)));
+		throw std::runtime_error(  // callers must be prepared for this exception
+			"Attempting to get query that was not submitted");
+	}
+	return queries.find(QueryKey::from_qdesc(query_desc))->second;  // cannot miss: checked above
+}
+
+void
+EventSender::submit_query(QueryDesc *query_desc)
+{
+	if (query_desc->gpsc_query_key)  // a key is already attached
+	{
+		ereport(WARNING,
+				(errmsg("GPSC trying to submit already submitted query")));
+		ereport(DEBUG3,
+				(errmsg("GPSC query sourceText: %s", query_desc->sourceText)));
+	}
+	QueryKey::register_qkey(query_desc, nesting_level);  // overwrites any existing key pointer without freeing it
+	auto key = QueryKey::from_qdesc(query_desc);
+	auto [_, inserted] = queries.emplace(key, QueryItem(QueryState::SUBMIT));  // new entries start in SUBMIT
+	if (!inserted)  // an equal key is already tracked; the existing entry is kept
+	{
+		ereport(WARNING, (errmsg("GPSC duplicate query submit detected")));
+		ereport(DEBUG3,
+				(errmsg("GPSC query sourceText: %s", query_desc->sourceText)));
+	}
+}
+
+// Adds a finished nested query to the running totals (call count and
+// end_time - start_time). Top-level queries are left out.
+void
+EventSender::update_nested_counters(QueryDesc *query_desc)
+{
+	if (is_top_level_query(query_desc, nesting_level))
+		return;
+
+	const auto &msg = *get_query(query_desc).message;
+	nested_calls++;
+	const double finished = protots_to_double(msg.end_time());
+	const double started = protots_to_double(msg.start_time());
+	if (!(finished >= started))
+	{
+		ereport(WARNING,
+				(errmsg("GPSC query start_time > end_time (%f > %f)",
+						started, finished)));
+		ereport(DEBUG3, (errmsg("GPSC nested query text %s",
+								query_desc->sourceText)));
+		return;
+	}
+	nested_timing += finished - started;
+}
+
+// True when the query descriptor carries a key and that key is currently
+// present in `queries`.
+bool
+EventSender::qdesc_submitted(QueryDesc *query_desc)
+{
+	if (query_desc->gpsc_query_key != NULL)
+		return queries.count(QueryKey::from_qdesc(query_desc)) > 0;
+	return false;
+}
+
+bool
+EventSender::nesting_is_valid(QueryDesc *query_desc, int nesting_level)  // parameter shadows the member of the same name
+{
+	return need_report_nested_query() ||  // nested reporting on: any level passes
+		   is_top_level_query(query_desc, nesting_level);  // otherwise top-level only
+}
+
+bool
+EventSender::need_report_nested_query()
+{
+	return config.report_nested_queries() && Gp_role == GP_ROLE_DISPATCH;  // setting on AND running as dispatcher
+}
+
+bool
+EventSender::filter_query(QueryDesc *query_desc)
+{
+	return gp_command_count == 0 || query_desc->sourceText == nullptr ||  // true means "skip this query"
+		   !config.enable_collector() || config.filter_user(get_user_name());  // collector off, or user filtered out
+}
+
+EventSender::QueryItem::QueryItem(QueryState st)
+	: message(std::make_unique<gpsc::SetQueryReq>()), state(st)  // starts with a fresh, empty message
+{
+}
diff --git a/gpcontrib/gp_stats_collector/src/EventSender.h b/gpcontrib/gp_stats_collector/src/EventSender.h
new file mode 100644
index 00000000000..2651a020593
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/EventSender.h
@@ -0,0 +1,203 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * EventSender.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/EventSender.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef EVENTSENDER_H
+#define EVENTSENDER_H
+
+#include <memory>
+#include <tuple>
+#include <unordered_map>
+
+#define typeid __typeid
+extern "C" {
+#include "utils/metrics_utils.h"
+#ifdef IC_TEARDOWN_HOOK
+#include "cdb/ic_udpifc.h"
+#endif
+}
+#undef typeid
+
+#include "Config.h"
+#include "memory/gpdbwrappers.h"
+
+class UDSConnector;
+struct QueryDesc;
+namespace gpsc
+{
+class SetQueryReq;
+}
+
+#include <cstdint>
+
+extern void gp_gettmid(int32 *);
+
+struct QueryKey  // value type used as the key of EventSender::queries
+{
+	int tmid;  // filled from gp_gettmid() in register_qkey
+	int ssid;  // filled from gp_session_id
+	int ccnt;  // filled from gp_command_count
+	int nesting_level;
+	uintptr_t query_desc_addr;  // address of the QueryDesc the key was registered for
+
+	bool
+	operator==(const QueryKey &other) const
+	{
+		return std::tie(tmid, ssid, ccnt, nesting_level, query_desc_addr) ==  // member-wise equality over all five fields
+			   std::tie(other.tmid, other.ssid, other.ccnt, other.nesting_level,
+						other.query_desc_addr);
+	}
+
+	static void
+	register_qkey(QueryDesc *query_desc, size_t nesting_level)  // allocates a key and attaches it to query_desc
+	{
+		query_desc->gpsc_query_key =  // any previous pointer is overwritten, not freed
+			(GpscQueryKey *) gpdb::palloc0(sizeof(GpscQueryKey));
+		int32 tmid;
+		gp_gettmid(&tmid);
+		query_desc->gpsc_query_key->tmid = tmid;
+		query_desc->gpsc_query_key->ssid = gp_session_id;
+		query_desc->gpsc_query_key->ccnt = gp_command_count;
+		query_desc->gpsc_query_key->nesting_level = nesting_level;
+		query_desc->gpsc_query_key->query_desc_addr = (uintptr_t) query_desc;
+	}
+
+	static QueryKey
+	from_qdesc(QueryDesc *query_desc)  // requires gpsc_query_key to be non-NULL: it is dereferenced unchecked
+	{
+		return {
+			.tmid = query_desc->gpsc_query_key->tmid,
+			.ssid = query_desc->gpsc_query_key->ssid,
+			.ccnt = query_desc->gpsc_query_key->ccnt,
+			.nesting_level = query_desc->gpsc_query_key->nesting_level,
+			.query_desc_addr = query_desc->gpsc_query_key->query_desc_addr,
+		};
+	}
+};
+
+// Mixes std::hash<T>(v) into seed, after Boost's hash_combine: https://www.boost.org/doc/libs/1_35_0/doc/html/boost/hash_combine_id241013.html
+template <class T>
+inline void
+hash_combine(std::size_t &seed, const T &v)
+{
+	std::hash<T> hasher;
+	seed ^= hasher(v) + 0x9e3779b9 + (seed << 6) + (seed >> 2);  // seed is updated in place
+}
+
+namespace std
+{
+template <>
+struct hash<QueryKey>  // lets QueryKey be the key type of std::unordered_map
+{
+	size_t
+	operator()(const QueryKey &k) const noexcept
+	{
+		size_t seed = hash<uint32_t>{}(k.tmid);  // the int tmid is converted to uint32_t for the seed
+		hash_combine(seed, k.ssid);
+		hash_combine(seed, k.ccnt);
+		hash_combine(seed, k.nesting_level);
+		uintptr_t addr = k.query_desc_addr;
+		if constexpr (SIZE_MAX < UINTPTR_MAX)  // only where uintptr_t is wider than size_t
+		{
+			addr %= SIZE_MAX;  // reduce the address below SIZE_MAX
+		}
+		hash_combine(seed, addr);  // covers the same five fields as operator==
+		return seed;
+	}
+};
+}  // namespace std
+
+class EventSender  // tracks queries by QueryKey and emits their lifecycle events
+{
+public:
+	void executor_before_start(QueryDesc *query_desc, int eflags);  // enables instrumentation when analyze applies
+	void executor_after_start(QueryDesc *query_desc, int eflags);  // emits "started"
+	void executor_end(QueryDesc *query_desc);  // emits "ended"
+	void query_metrics_collect(QueryMetricsStatus status, void *arg,  // arg is cast to QueryDesc *
+							   bool utility, ErrorData *edata = NULL);
+	void ic_metrics_collect();  // no-op without IC_TEARDOWN_HOOK
+	void analyze_stats_collect(QueryDesc *query_desc);
+	void
+	incr_depth()  // callers bracket nested execution with incr_depth/decr_depth
+	{
+		nesting_level++;
+	}
+	void
+	decr_depth()
+	{
+		nesting_level--;  // no lower bound is enforced here
+	}
+	EventSender();
+	~EventSender();  // logs every query still tracked
+
+private:
+	enum QueryState  // unscoped: members are also usable without the QueryState:: prefix
+	{
+		SUBMIT,
+		START,
+		END,
+		DONE
+	};
+
+	struct QueryItem  // one tracked query: its message under construction plus its state
+	{
+		std::unique_ptr<gpsc::SetQueryReq> message;
+		QueryState state;
+
+		explicit QueryItem(QueryState st);
+	};
+
+	bool log_query_req(const gpsc::SetQueryReq &req, const std::string &event,  // true: caller should clear big fields
+					   bool utility);
+	bool verify_query(QueryDesc *query_desc, QueryState state, bool utility);  // true: process this event
+	void update_query_state(QueryItem &query, QueryState new_state,
+							bool utility, bool success = true);
+	QueryItem &get_query(QueryDesc *query_desc);  // throws std::runtime_error when not submitted
+	void submit_query(QueryDesc *query_desc);
+	void collect_query_submit(QueryDesc *query_desc, bool utility);
+	void report_query_done(QueryDesc *query_desc, QueryItem &query,
+						   QueryMetricsStatus status, bool utility,
+						   ErrorData *edata = NULL);
+	void collect_query_done(QueryDesc *query_desc, bool utility,
+							QueryMetricsStatus status, ErrorData *edata = NULL);
+	void update_nested_counters(QueryDesc *query_desc);
+	bool qdesc_submitted(QueryDesc *query_desc);
+	bool nesting_is_valid(QueryDesc *query_desc, int nesting_level);
+	bool need_report_nested_query();
+	bool filter_query(QueryDesc *query_desc);  // true: skip this query
+
+	bool proto_verified = false;  // set by the constructor after the protobuf version check
+	int nesting_level = 0;  // current depth, driven by incr_depth/decr_depth
+	int64_t nested_calls = 0;  // nested queries counted since the last top-level SUBMIT
+	double nested_timing = 0;  // summed end_time - start_time of those nested queries
+#ifdef IC_TEARDOWN_HOOK
+	ICStatistics ic_statistics;  // zeroed in the constructor, accumulated by ic_metrics_collect
+#endif
+	std::unordered_map<QueryKey, QueryItem> queries;  // entries live from submit_query to collect_query_done
+
+	Config config;  // synced in the constructor and at each SUBMIT
+};
+#endif /* EVENTSENDER_H */
diff --git a/gpcontrib/gp_stats_collector/src/GpscStat.cpp b/gpcontrib/gp_stats_collector/src/GpscStat.cpp
new file mode 100644
index 00000000000..151cfd87c02
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/GpscStat.cpp
@@ -0,0 +1,154 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * GpscStat.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/GpscStat.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "GpscStat.h"
+
+#include <algorithm>
+
+extern "C" {
+#include "postgres.h"
+#include "miscadmin.h"
+#include "storage/ipc.h"
+#include "storage/lwlock.h"
+#include "storage/shmem.h"
+#include "storage/spin.h"
+}
+
+namespace
+{
+struct ProtectedData  // the counters together with the spinlock guarding them
+{
+	slock_t mutex;
+	GpscStat::Data data;
+};
+shmem_startup_hook_type prev_shmem_startup_hook = NULL;  // hook that was installed before ours
+ProtectedData *data = nullptr;  // stays null until gpsc_shmem_startup() has run
+
+void
+gpsc_shmem_startup()  // shmem startup hook installed by GpscStat::init()
+{
+	if (prev_shmem_startup_hook)
+		prev_shmem_startup_hook();  // chain to the previously installed hook first
+	LWLockAcquire(AddinShmemInitLock, LW_EXCLUSIVE);
+	bool found;
+	data = reinterpret_cast<ProtectedData *>(
+		ShmemInitStruct("gpsc_stat_messages", sizeof(ProtectedData), &found));
+	if (!found)  // the struct did not exist yet: initialise it here
+	{
+		SpinLockInit(&data->mutex);
+		data->data = GpscStat::Data();  // value-initialised: all counters zero
+	}
+	LWLockRelease(AddinShmemInitLock);
+}
+
+class LockGuard  // scope guard: holds the spinlock for the lifetime of the object
+{
+public:
+	LockGuard(slock_t *mutex) : mutex_(mutex)
+	{
+		SpinLockAcquire(mutex_);
+	}
+	~LockGuard()
+	{
+		SpinLockRelease(mutex_);
+	}
+
+private:
+	slock_t *mutex_;  // NOTE(review): copying is not disabled; a copy would release twice
+};
+}  // namespace
+
+void
+GpscStat::init()
+{
+	if (!process_shared_preload_libraries_in_progress)
+		return;  // nothing is installed: `data` stays null and loaded() stays false
+	RequestAddinShmemSpace(sizeof(ProtectedData));
+	prev_shmem_startup_hook = shmem_startup_hook;  // remembered so our hook can chain to it
+	shmem_startup_hook = gpsc_shmem_startup;
+}
+
+void
+GpscStat::deinit()
+{
+	shmem_startup_hook = prev_shmem_startup_hook;  // NOTE(review): unconditional, even when init() returned early
+}
+
+void
+GpscStat::reset()
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	data->data = GpscStat::Data();  // all counters back to zero
+}
+
+void
+GpscStat::report_send(int32_t msg_size)
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	data->data.total++;
+	data->data.max_message_size =  // keeps the largest size reported so far
+		std::max(msg_size, data->data.max_message_size);
+}
+
+void
+GpscStat::report_bad_connection()
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	data->data.total++;  // failures count towards the total as well
+	data->data.failed_connects++;
+}
+
+void
+GpscStat::report_bad_send(int32_t msg_size)
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	data->data.total++;
+	data->data.failed_sends++;
+	data->data.max_message_size =  // a failed send still updates the size maximum
+		std::max(msg_size, data->data.max_message_size);
+}
+
+void
+GpscStat::report_error()
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	data->data.total++;
+	data->data.failed_other++;  // failures that are neither connect nor send failures
+}
+
+GpscStat::Data
+GpscStat::get_stats()
+{
+	LockGuard lg(&data->mutex);  // dereferences `data`: only valid once loaded() is true
+	return data->data;  // returned by value: a copy taken under the lock
+}
+
+bool
+GpscStat::loaded()
+{
+	return data != nullptr;  // true once gpsc_shmem_startup() has attached the struct
+}
diff --git a/gpcontrib/gp_stats_collector/src/GpscStat.h b/gpcontrib/gp_stats_collector/src/GpscStat.h
new file mode 100644
index 00000000000..d82930c7b5b
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/GpscStat.h
@@ -0,0 +1,52 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * GpscStat.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/GpscStat.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef GPSCSTAT_H
+#define GPSCSTAT_H
+
+#include <cstdint>
+
+class GpscStat  // static-only facade over the counters kept in shared memory
+{
+public:
+	struct Data  // plain counters; copied out as a whole by get_stats()
+	{
+		int64_t total, failed_sends, failed_connects, failed_other;  // total is bumped by every report_* call
+		int32_t max_message_size;  // largest msg_size passed to report_send/report_bad_send
+	};
+
+	static void init();  // requests shared memory and installs the startup hook (preload only)
+	static void deinit();  // restores the previously saved startup hook
+	static void reset();  // zeroes all counters
+	static void report_send(int32_t msg_size);
+	static void report_bad_connection();
+	static void report_bad_send(int32_t msg_size);
+	static void report_error();
+	static Data get_stats();  // snapshot copied under the spinlock
+	static bool loaded();  // false until the shared struct is attached; the other calls dereference it
+};
+#endif /* GPSCSTAT_H */
diff --git a/gpcontrib/gp_stats_collector/src/PgUtils.cpp b/gpcontrib/gp_stats_collector/src/PgUtils.cpp
new file mode 100644
index 00000000000..c473cc383f2
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/PgUtils.cpp
@@ -0,0 +1,104 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * PgUtils.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/PgUtils.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "PgUtils.h"
+#include "Config.h"
+#include "memory/gpdbwrappers.h"
+
+extern "C" {
+#include "cdb/cdbvars.h"
+#include "commands/resgroupcmds.h"
+}
+
+std::string
+get_user_name()
+{
+	// Borrowed string (presumably GUC-owned - confirm); it must not be pfree'd.
+	const char *username =
+		gpdb::get_config_option("session_authorization", false, false);
+	return username ? std::string(username) : "";  // a NULL result maps to ""
+}
+
+// Name of the current database (MyDatabaseId), or "" when the lookup
+// yields NULL. The looked-up C string is copied and then pfree'd.
+std::string
+get_db_name()
+{
+	char *raw = gpdb::get_database_name(MyDatabaseId);
+	if (raw == nullptr)
+		return "";
+	std::string name(raw);
+	gpdb::pfree(raw);
+	return name;
+}
+
+std::string
+get_rg_name()
+{
+	auto groupId = gpdb::get_rg_id_by_session_id(MySessionState->sessionId);  // MySessionState is dereferenced unchecked
+	if (!OidIsValid(groupId))
+		return "";  // no valid resource group id for this session
+
+	char *rgname = gpdb::get_rg_name_for_id(groupId);
+	if (rgname == nullptr)
+		return "";  // the id did not resolve to a name
+
+	std::string result(rgname);  // copy first, then release the looked-up string
+	gpdb::pfree(rgname);
+	return result;
+}
+
+/**
+ * Things get tricky with nested queries.
+ * a) A nested query on master is a real query optimized and executed from
+ * master. An example would be `select some_insert_function();`, where
+ * some_insert_function does something like `insert into tbl values (1)`. Master
+ * will create two statements: the outer select statement and the inner insert
+ * statement with nesting level 1.
+ * For segments both statements are top-level statements with nesting level 0.
+ * b) A nested query on segment is something executed as sub-statement on
+ * segment. An example would be `select a from tbl where is_good_value(b);`. In
+ * this case master will issue one top-level statement, but segments will change
+ * contexts for UDF execution and execute is_good_value(b) once for each tuple
+ * as a nested query, creating massive load on the external agent.
+ *
+ * Hence, here is a decision:
+ * 1) ignore all queries that are nested on segments
+ * 2) record (if enabled) all queries that are nested on master
+ * NOTE: The truth is, we can't really ignore nested master queries, because
+ * segment sees those as top-level.
+ */
+
+bool
+is_top_level_query(QueryDesc *query_desc, int nesting_level)
+{
+	if (query_desc->gpsc_query_key == NULL)  // no key registered yet
+	{
+		return nesting_level == 0;  // fall back to the caller-supplied level
+	}
+	return query_desc->gpsc_query_key->nesting_level == 0;  // the registered level wins over the argument
+}
diff --git a/gpcontrib/gp_stats_collector/src/PgUtils.h b/gpcontrib/gp_stats_collector/src/PgUtils.h
new file mode 100644
index 00000000000..d9f673e7cbc
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/PgUtils.h
@@ -0,0 +1,38 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * PgUtils.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/PgUtils.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef PGUTILS_H
+#define PGUTILS_H
+
+extern "C" {
+#include "postgres.h"
+#include "commands/explain.h"
+}
+
+#include <string>
+
+/* Returns a user name as std::string. NOTE(review): the definition is not
+ * visible from this header; confirm which role it reports. */
+std::string get_user_name();
+
+/* Returns the name of the database identified by MyDatabaseId, or an empty
+ * string when no name is available. */
+std::string get_db_name();
+
+/* Returns the resource group name looked up for the current session id, or
+ * an empty string when the group id is invalid or has no name. */
+std::string get_rg_name();
+
+/* Returns true when the query is at nesting level 0. The level stored in
+ * query_desc->gpsc_query_key takes precedence over nesting_level when the key
+ * is present. */
+bool is_top_level_query(QueryDesc *query_desc, int nesting_level);
+
+#endif /* PGUTILS_H */
diff --git a/gpcontrib/gp_stats_collector/src/ProcStats.cpp b/gpcontrib/gp_stats_collector/src/ProcStats.cpp
new file mode 100644
index 00000000000..e308b30dfa5
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/ProcStats.cpp
@@ -0,0 +1,144 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * ProcStats.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/ProcStats.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "ProcStats.h"
+#include <fstream>
+#include <string>
+#include <unistd.h>
+#include "gpsc_metrics.pb.h"
+
+extern "C" {
+#include "postgres.h"
+#include "utils/elog.h"
+}
+
+namespace
+{
+// Reads one "<label> <value>" pair from the stream and stores, in the
+// same-named SystemStat field, the difference between the value just read and
+// the value the field held before. Expects `proc_stat`, `tmp` and `stats` to be
+// in scope at the expansion site. The local is zero-initialised so that a
+// failed extraction never leaves it indeterminate.
+#define FILL_IO_STAT(stat_name)    \
+	uint64_t stat_name = 0;        \
+	proc_stat >> tmp >> stat_name; \
+	stats->set_##stat_name(stat_name - stats->stat_name());
+
+// Updates the I/O counters of `stats` from /proc/self/io. Each field is set
+// to (current counter - previous field value). When the file cannot be
+// opened, `stats` is left untouched.
+void
+fill_io_stats(gpsc::SystemStat *stats)
+{
+	std::ifstream proc_stat("/proc/self/io");
+	if (!proc_stat.is_open())
+	{
+		// Nothing to read: do not overwrite the fields with bogus deltas.
+		return;
+	}
+
+	// Receives the "<label>:" token preceding every value.
+	std::string tmp;
+	// The order below follows the order in which the fields are read from
+	// the file.
+	FILL_IO_STAT(rchar);
+	FILL_IO_STAT(wchar);
+	FILL_IO_STAT(syscr);
+	FILL_IO_STAT(syscw);
+	FILL_IO_STAT(read_bytes);
+	FILL_IO_STAT(write_bytes);
+	FILL_IO_STAT(cancelled_write_bytes);
+}
+
+// Updates CPU time and memory fields of `stats` from /proc/self/stat.
+//
+// User and kernel times are converted from clock ticks to seconds and stored
+// as (current value - previous field value); vsize and rss are stored as read.
+// When the file cannot be opened, `stats` is left untouched.
+//
+// NOTE(review): tokens are split on whitespace, which assumes the second
+// token (the command name) contains no spaces - confirm for this process.
+void
+fill_cpu_stats(gpsc::SystemStat *stats)
+{
+	// Zero-based positions of the whitespace-separated tokens of interest.
+	static const int UTIME_ID = 13;
+	static const int STIME_ID = 14;
+	static const int VSIZE_ID = 22;
+	static const int RSS_ID = 23;
+	// Clock ticks per second, used to convert utime/stime to seconds.
+	static const double tps = sysconf(_SC_CLK_TCK);
+
+	std::ifstream proc_stat("/proc/self/stat");
+	if (!proc_stat.is_open())
+	{
+		// Nothing to read: do not overwrite the fields with bogus values.
+		return;
+	}
+
+	std::string trash;
+	for (int i = 0; i <= RSS_ID; ++i)
+	{
+		switch (i)
+		{
+			case UTIME_ID:
+			{
+				double utime = 0;
+				proc_stat >> utime;
+				stats->set_usertimeseconds(utime / tps -
+										   stats->usertimeseconds());
+				break;
+			}
+			case STIME_ID:
+			{
+				double stime = 0;
+				proc_stat >> stime;
+				stats->set_kerneltimeseconds(stime / tps -
+											 stats->kerneltimeseconds());
+				break;
+			}
+			case VSIZE_ID:
+			{
+				uint64_t vsize = 0;
+				proc_stat >> vsize;
+				stats->set_vsize(vsize);
+				break;
+			}
+			case RSS_ID:
+			{
+				// proc(5) documents rss as an integer count of pages, so
+				// an integer extraction is the right one here.
+				uint64_t rss = 0;
+				proc_stat >> rss;
+				stats->set_rss(rss);
+				break;
+			}
+			default:
+				// Token we do not care about; consume and discard it.
+				proc_stat >> trash;
+		}
+	}
+}
+
+// Fills the VmPeak and VmSize fields of `stats` from /proc/self/status.
+//
+// Both values are expected to be followed by the unit "kB"; any other unit
+// raises std::runtime_error. The unit is read for each entry individually, so
+// the check never relies on a unit left over from a previously parsed line.
+void
+fill_status_stats(gpsc::SystemStat *stats)
+{
+	std::ifstream proc_stat("/proc/self/status");
+	std::string key, measure;
+	while (proc_stat >> key)
+	{
+		if (key == "VmPeak:")
+		{
+			uint64_t value = 0;
+			proc_stat >> value >> measure;
+			stats->set_vmpeakkb(value);
+			if (measure != "kB")
+			{
+				throw std::runtime_error(
+					"Expected memory sizes in kB, but got in " + measure);
+			}
+		}
+		else if (key == "VmSize:")
+		{
+			uint64_t value = 0;
+			// Read this entry's own unit before validating it.
+			proc_stat >> value >> measure;
+			stats->set_vmsizekb(value);
+			if (measure != "kB")
+			{
+				throw std::runtime_error(
+					"Expected memory sizes in kB, but got in " + measure);
+			}
+		}
+	}
+}
+}  // namespace
+
+// Refreshes `stats` with this process's own numbers, gathered in turn from
+// /proc/self/io, /proc/self/stat and /proc/self/status.
+void
+fill_self_stats(gpsc::SystemStat *stats)
+{
+	fill_io_stats(stats);      // I/O counters
+	fill_cpu_stats(stats);     // CPU times, vsize, rss
+	fill_status_stats(stats);  // VmPeak / VmSize
+}
\ No newline at end of file
diff --git a/gpcontrib/gp_stats_collector/src/ProcStats.h b/gpcontrib/gp_stats_collector/src/ProcStats.h
new file mode 100644
index 00000000000..8b83dbfef02
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/ProcStats.h
@@ -0,0 +1,37 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * ProcStats.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/ProcStats.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef PROCSTATS_H
+#define PROCSTATS_H
+
+namespace gpsc
+{
+class SystemStat;
+}
+
+void fill_self_stats(gpsc::SystemStat *stats);
+#endif /* PROCSTATS_H */
diff --git a/gpcontrib/gp_stats_collector/src/ProtoUtils.cpp b/gpcontrib/gp_stats_collector/src/ProtoUtils.cpp
new file mode 100644
index 00000000000..b22f580303e
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/ProtoUtils.cpp
@@ -0,0 +1,375 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * ProtoUtils.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/ProtoUtils.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "ProtoUtils.h"
+#include "Config.h"
+#include "PgUtils.h"
+#include "ProcStats.h"
+#include "memory/gpdbwrappers.h"
+
+#define typeid __typeid
+#define operator __operator
+extern "C" {
+#include "postgres.h"
+#include "access/hash.h"
+#include "access/xact.h"
+#include "cdb/cdbinterconnect.h"
+#include "cdb/cdbvars.h"
+#include "cdb/ml_ipc.h"
+#ifdef IC_TEARDOWN_HOOK
+#include "cdb/ic_udpifc.h"
+#endif
+#include "utils/workfile_mgr.h"
+}
+#undef typeid
+#undef operator
+
+#include <ctime>
+#include <string>
+
+extern void gp_gettmid(int32 *);
+
+namespace
+{
+// Selects the two most significant bits of a byte.
+constexpr uint8_t UTF8_CONTINUATION_BYTE_MASK = 0xC0;
+// Value of those two bits (10xxxxxx) for a UTF-8 continuation byte.
+constexpr uint8_t UTF8_CONTINUATION_BYTE = 0x80;
+// Longest encoding of a single character that the trimming code looks at.
+constexpr uint8_t UTF8_MAX_SYMBOL_BYTES = 4;
+
+// Tells whether `byte` begins a UTF-8 character: true for anything that is
+// not a continuation byte (10xxxxxx), false for a continuation byte.
+inline bool
+utf8_start_byte(uint8_t byte)
+{
+	const bool is_continuation =
+		(byte & UTF8_CONTINUATION_BYTE_MASK) == UTF8_CONTINUATION_BYTE;
+	return !is_continuation;
+}
+}  // namespace
+
+// Builds a protobuf Timestamp from the wall-clock time reported by
+// gettimeofday().
+google::protobuf::Timestamp
+current_ts()
+{
+	struct timeval now;
+	gettimeofday(&now, nullptr);
+
+	google::protobuf::Timestamp stamp;
+	stamp.set_seconds(now.tv_sec);
+	// timeval carries microseconds; the Timestamp field holds nanoseconds.
+	stamp.set_nanos(static_cast<int32_t>(now.tv_usec * 1000));
+	return stamp;
+}
+
+// Fills `key` with the identifiers of the current query: the command count,
+// the session id and the tmid obtained from gp_gettmid().
+void
+set_query_key(gpsc::QueryKey *key)
+{
+	key->set_ccnt(gp_command_count);
+	key->set_ssid(gp_session_id);
+
+	// gp_gettmid() reports its result through an out-parameter.
+	int32 tm_id = 0;
+	gp_gettmid(&tm_id);
+	key->set_tmid(tm_id);
+}
+
+// Copies this process's dbid and segindex from GpIdentity into `key`.
+void
+set_segment_key(gpsc::SegmentKey *key)
+{
+	const auto &identity = GpIdentity;
+	key->set_dbid(identity.dbid);
+	key->set_segindex(identity.segindex);
+}
+
+// Returns at most `lim` bytes of `str` (which holds `len` bytes) as a
+// std::string.
+//
+// - A null `str` yields an empty string.
+// - If the text already fits, or the database encoding is not UTF-8, the
+//   first min(len, lim) bytes are returned as they are.
+// - Otherwise the cut position is moved backwards so that the result never
+//   ends in the middle of a multi-byte UTF-8 character.
+std::string
+trim_str_shrink_utf8(const char *str, size_t len, size_t lim)
+{
+	if (unlikely(str == nullptr))
+		return std::string();
+
+	const bool fits = len <= lim;
+	if (likely(fits || GetDatabaseEncoding() != PG_UTF8))
+		return std::string(str, fits ? len : lim);
+
+	// str[cut_pos] is the first byte that gets dropped. While it is a
+	// continuation byte, step back; stop as soon as it is a start byte, at
+	// the beginning of the string, or once the longest possible character
+	// has been walked over.
+	size_t cut_pos = lim;
+	for (size_t seen = 1; seen < UTF8_MAX_SYMBOL_BYTES && cut_pos > 0; ++seen)
+	{
+		if (utf8_start_byte(static_cast<uint8_t>(str[cut_pos])))
+			break;
+		--cut_pos;
+	}
+
+	return std::string(str, cut_pos);
+}
+
+// Stores plan information in the query_info of `req`: the plan generator,
+// the (size-limited) plan text, the normalized plan text with its hash as
+// plan id, and the query id.
+//
+// Does nothing unless this process is the dispatcher and the query has a
+// planned statement. Plan texts are limited to config.max_plan_size() bytes.
+void
+set_query_plan(gpsc::SetQueryReq *req, QueryDesc *query_desc,
+			   const Config &config)
+{
+	if (Gp_role != GP_ROLE_DISPATCH || !query_desc->plannedstmt)
+		return;
+
+	auto *info = req->mutable_query_info();
+	const bool from_optimizer =
+		query_desc->plannedstmt->planGen == PLANGEN_OPTIMIZER;
+	info->set_generator(from_optimizer
+							? gpsc::PlanGenerator::PLAN_GENERATOR_OPTIMIZER
+							: gpsc::PlanGenerator::PLAN_GENERATOR_PLANNER);
+
+	// Work inside the query's memory context while the plan is rendered.
+	MemoryContext saved_cxt =
+		gpdb::mem_ctx_switch_to(query_desc->estate->es_query_cxt);
+	ExplainState es = gpdb::get_explain_state(query_desc, true);
+	if (es.str)
+	{
+		const size_t plan_limit = config.max_plan_size();
+		*info->mutable_plan_text() =
+			trim_str_shrink_utf8(es.str->data, es.str->len, plan_limit);
+
+		StringInfo norm_plan = gpdb::gen_normplan(es.str->data);
+		if (norm_plan)
+		{
+			*info->mutable_template_plan_text() = trim_str_shrink_utf8(
+				norm_plan->data, norm_plan->len, plan_limit);
+			// The plan id is the hash of the full normalized plan.
+			info->set_plan_id(hash_any((unsigned char *) norm_plan->data,
+									   norm_plan->len));
+			gpdb::pfree(norm_plan->data);
+		}
+		info->set_query_id(query_desc->plannedstmt->queryId);
+		gpdb::pfree(es.str->data);
+	}
+	gpdb::mem_ctx_switch_to(saved_cxt);
+}
+
+// Stores the query text and its normalized form in the query_info of `req`,
+// each limited to config.max_text_size() bytes.
+//
+// Does nothing unless this process is the dispatcher and the query has a
+// source text.
+void
+set_query_text(gpsc::SetQueryReq *req, QueryDesc *query_desc,
+			   const Config &config)
+{
+	const char *source = query_desc->sourceText;
+	if (Gp_role != GP_ROLE_DISPATCH || !source)
+		return;
+
+	auto *info = req->mutable_query_info();
+	*info->mutable_query_text() =
+		trim_str_shrink_utf8(source, strlen(source), config.max_text_size());
+
+	// The normalized text is released here once it has been copied.
+	if (char *normalized = gpdb::gen_normquery(source))
+	{
+		*info->mutable_template_query_text() = trim_str_shrink_utf8(
+			normalized, strlen(normalized), config.max_text_size());
+		gpdb::pfree(normalized);
+	}
+}
+
+// On the dispatcher, clears the text fields of the request's query_info:
+// plan, template plan, query, template query and analyze texts.
+void
+clear_big_fields(gpsc::SetQueryReq *req)
+{
+	if (Gp_role != GP_ROLE_DISPATCH)
+		return;
+
+	auto *info = req->mutable_query_info();
+	info->clear_plan_text();
+	info->clear_template_plan_text();
+	info->clear_query_text();
+	info->clear_template_query_text();
+	info->clear_analyze_text();
+}
+
+// On the dispatcher, stores user name, database name and resource group name
+// in the query_info of `req`. The database name is only filled in while a
+// transaction is in progress.
+void
+set_query_info(gpsc::SetQueryReq *req)
+{
+	if (Gp_role != GP_ROLE_DISPATCH)
+		return;
+
+	auto *info = req->mutable_query_info();
+	info->set_username(get_user_name());
+	if (IsTransactionState())
+	{
+		info->set_databasename(get_db_name());
+	}
+	info->set_rsgname(get_rg_name());
+}
+
+// Records `nesting_level` as the nested_level of the request's add_info.
+void
+set_qi_nesting_level(gpsc::SetQueryReq *req, int nesting_level)
+{
+	req->mutable_add_info()->set_nested_level(nesting_level);
+}
+
+// Records the value of currentSliceId as the slice_id of the request's
+// add_info.
+void
+set_qi_slice_id(gpsc::SetQueryReq *req)
+{
+	req->mutable_add_info()->set_slice_id(currentSliceId);
+}
+
+void
+set_qi_error_message(gpsc::SetQueryReq *req, const char *err_msg,
+					 const Config &config)
+{
+	auto aqi = req->mutable_add_info();
+	*aqi->mutable_error_message() =
+		trim_str_shrink_utf8(err_msg, strlen(err_msg), config.max_text_size());
+}
+
+// Copies executor instrumentation of `query_desc` into `metrics`.
+//
+// - When the top plan state has an Instrumentation, its tuple/loop/timing
+//   counters and buffer usage are copied.
+// - When the executor state has a motion layer context, its sent/received
+//   byte and chunk counters are copied.
+// - `nested_calls` and `nested_time` are always stored as inherited calls
+//   and inherited time.
+//
+// query_desc->planstate is dereferenced without a check here.
+void
+set_metric_instrumentation(gpsc::MetricInstrumentation *metrics,
+						   QueryDesc *query_desc, int nested_calls,
+						   double nested_time)
+{
+	if (auto instr = query_desc->planstate->instrument)
+	{
+		metrics->set_ntuples(instr->ntuples);
+		metrics->set_nloops(instr->nloops);
+		metrics->set_tuplecount(instr->tuplecount);
+		metrics->set_firsttuple(instr->firsttuple);
+		metrics->set_startup(instr->startup);
+		metrics->set_total(instr->total);
+
+		auto &buffers = instr->bufusage;
+		metrics->set_shared_blks_hit(buffers.shared_blks_hit);
+		metrics->set_shared_blks_read(buffers.shared_blks_read);
+		metrics->set_shared_blks_dirtied(buffers.shared_blks_dirtied);
+		metrics->set_shared_blks_written(buffers.shared_blks_written);
+		metrics->set_local_blks_hit(buffers.local_blks_hit);
+		metrics->set_local_blks_read(buffers.local_blks_read);
+		metrics->set_local_blks_dirtied(buffers.local_blks_dirtied);
+		metrics->set_local_blks_written(buffers.local_blks_written);
+		metrics->set_temp_blks_read(buffers.temp_blks_read);
+		metrics->set_temp_blks_written(buffers.temp_blks_written);
+		metrics->set_blk_read_time(
+			INSTR_TIME_GET_DOUBLE(buffers.blk_read_time));
+		metrics->set_blk_write_time(
+			INSTR_TIME_GET_DOUBLE(buffers.blk_write_time));
+	}
+
+	auto *estate = query_desc->estate;
+	if (estate && estate->motionlayer_context)
+	{
+		auto *motion = (MotionLayerState *) estate->motionlayer_context;
+
+		auto *sent = metrics->mutable_sent();
+		sent->set_total_bytes(motion->stat_total_bytes_sent);
+		sent->set_tuple_bytes(motion->stat_tuple_bytes_sent);
+		sent->set_chunks(motion->stat_total_chunks_sent);
+
+		auto *received = metrics->mutable_received();
+		received->set_total_bytes(motion->stat_total_bytes_recvd);
+		received->set_tuple_bytes(motion->stat_tuple_bytes_recvd);
+		received->set_chunks(motion->stat_total_chunks_recvd);
+	}
+
+	metrics->set_inherited_calls(nested_calls);
+	metrics->set_inherited_time(nested_time);
+}
+
+// Fills `metrics` for `query_desc`.
+//
+// Instrumentation is copied only when the plan state and its Instrumentation
+// exist. Process statistics are refreshed through fill_self_stats(). Running
+// time and spill counters are stored as (current value - previous field
+// value).
+void
+set_gp_metrics(gpsc::GPMetrics *metrics, QueryDesc *query_desc,
+			   int nested_calls, double nested_time)
+{
+	const bool has_instrumentation =
+		query_desc->planstate && query_desc->planstate->instrument;
+	if (has_instrumentation)
+	{
+		set_metric_instrumentation(metrics->mutable_instrumentation(),
+								   query_desc, nested_calls, nested_time);
+	}
+
+	auto *system_stat = metrics->mutable_systemstat();
+	fill_self_stats(system_stat);
+	system_stat->set_runningtimeseconds(time(NULL) -
+										system_stat->runningtimeseconds());
+
+	auto *spill = metrics->mutable_spill();
+	spill->set_filecount(WorkfileTotalFilesCreated() - spill->filecount());
+	spill->set_totalbytes(WorkfileTotalBytesWritten() - spill->totalbytes());
+}
+
+#define UPDATE_IC_STATS(proto_name, stat_name)                   \
+	metrics->mutable_interconnect()->set_##proto_name(           \
+		ic_statistics->stat_name -                               \
+		metrics->mutable_interconnect()->proto_name());          \
+	Assert(metrics->mutable_interconnect()->proto_name() >= 0 && \
+		   metrics->mutable_interconnect()->proto_name() <=      \
+			   ic_statistics->stat_name)
+
+void
+set_ic_stats(gpsc::MetricInstrumentation *metrics,
+			 const ICStatistics *ic_statistics)
+{
+#ifdef IC_TEARDOWN_HOOK
+	UPDATE_IC_STATS(total_recv_queue_size, totalRecvQueueSize);
+	UPDATE_IC_STATS(recv_queue_size_counting_time, recvQueueSizeCountingTime);
+	UPDATE_IC_STATS(total_capacity, totalCapacity);
+	UPDATE_IC_STATS(capacity_counting_time, capacityCountingTime);
+	UPDATE_IC_STATS(total_buffers, totalBuffers);
+	UPDATE_IC_STATS(buffer_counting_time, bufferCountingTime);
+	UPDATE_IC_STATS(active_connections_num, activeConnectionsNum);
+	UPDATE_IC_STATS(retransmits, retransmits);
+	UPDATE_IC_STATS(startup_cached_pkt_num, startupCachedPktNum);
+	UPDATE_IC_STATS(mismatch_num, mismatchNum);
+	UPDATE_IC_STATS(crc_errors, crcErrors);
+	UPDATE_IC_STATS(snd_pkt_num, sndPktNum);
+	UPDATE_IC_STATS(recv_pkt_num, recvPktNum);
+	UPDATE_IC_STATS(disordered_pkt_num, disorderedPktNum);
+	UPDATE_IC_STATS(duplicated_pkt_num, duplicatedPktNum);
+	UPDATE_IC_STATS(recv_ack_num, recvAckNum);
+	UPDATE_IC_STATS(status_query_msg_num, statusQueryMsgNum);
+#endif
+}
+
+// Creates a SetQueryReq carrying `status`, the current timestamp, and the
+// query and segment keys of this process.
+gpsc::SetQueryReq
+create_query_req(gpsc::QueryStatus status)
+{
+	gpsc::SetQueryReq request;
+
+	request.set_query_status(status);
+	*request.mutable_datetime() = current_ts();
+	set_query_key(request.mutable_query_key());
+	set_segment_key(request.mutable_segment_key());
+
+	return request;
+}
+
+// Converts a protobuf Timestamp to seconds as a double: whole seconds plus
+// the nanosecond part scaled down by 10^9.
+double
+protots_to_double(const google::protobuf::Timestamp &ts)
+{
+	const double whole_seconds = static_cast<double>(ts.seconds());
+	const double fraction = static_cast<double>(ts.nanos()) / 1000000000.0;
+	return whole_seconds + fraction;
+}
+
+// Stores the analyze output of `query_desc` as the analyze_text of the
+// request's query_info, limited to config.max_plan_size() bytes and without
+// a trailing line break.
+//
+// Does nothing outside of a transaction or for a query without a planned
+// statement (the original comment names utility statements).
+void
+set_analyze_plan_text(QueryDesc *query_desc, gpsc::SetQueryReq *req,
+					  const Config &config)
+{
+	// ExplainPrintPlan() later on needs a valid transaction and a
+	// non-utility statement.
+	const bool can_explain = IsTransactionState() && query_desc->plannedstmt;
+	if (!can_explain)
+		return;
+
+	// Only the analyze state is built inside the query's memory context.
+	MemoryContext saved_cxt =
+		gpdb::mem_ctx_switch_to(query_desc->estate->es_query_cxt);
+	ExplainState es = gpdb::get_analyze_state(
+		query_desc, query_desc->instrument_options && config.enable_analyze());
+	gpdb::mem_ctx_switch_to(saved_cxt);
+
+	if (!es.str)
+		return;
+
+	// Drop one trailing line break, if present.
+	if (es.str->len > 0 && es.str->data[es.str->len - 1] == '\n')
+	{
+		es.str->data[--es.str->len] = '\0';
+	}
+
+	auto analyze_text = trim_str_shrink_utf8(es.str->data, es.str->len,
+											 config.max_plan_size());
+	req->mutable_query_info()->set_analyze_text(analyze_text);
+	gpdb::pfree(es.str->data);
+}
diff --git a/gpcontrib/gp_stats_collector/src/ProtoUtils.h b/gpcontrib/gp_stats_collector/src/ProtoUtils.h
new file mode 100644
index 00000000000..6b38097fbcc
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/ProtoUtils.h
@@ -0,0 +1,57 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * ProtoUtils.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/ProtoUtils.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef PROTOUTILS_H
+#define PROTOUTILS_H
+
+#include "protos/gpsc_set_service.pb.h"
+
+struct QueryDesc;
+struct ICStatistics;
+class Config;
+
+google::protobuf::Timestamp current_ts();
+void set_query_plan(gpsc::SetQueryReq *req, QueryDesc *query_desc,
+					const Config &config);
+void set_query_text(gpsc::SetQueryReq *req, QueryDesc *query_desc,
+					const Config &config);
+void clear_big_fields(gpsc::SetQueryReq *req);
+void set_query_info(gpsc::SetQueryReq *req);
+void set_qi_nesting_level(gpsc::SetQueryReq *req, int nesting_level);
+void set_qi_slice_id(gpsc::SetQueryReq *req);
+void set_qi_error_message(gpsc::SetQueryReq *req, const char *err_msg,
+						  const Config &config);
+void set_gp_metrics(gpsc::GPMetrics *metrics, QueryDesc *query_desc,
+					int nested_calls, double nested_time);
+void set_ic_stats(gpsc::MetricInstrumentation *metrics,
+				  const ICStatistics *ic_statistics);
+gpsc::SetQueryReq create_query_req(gpsc::QueryStatus status);
+double protots_to_double(const google::protobuf::Timestamp &ts);
+void set_analyze_plan_text(QueryDesc *query_desc, gpsc::SetQueryReq *message,
+						   const Config &config);
+
+#endif /* PROTOUTILS_H */
diff --git a/gpcontrib/gp_stats_collector/src/UDSConnector.cpp b/gpcontrib/gp_stats_collector/src/UDSConnector.cpp
new file mode 100644
index 00000000000..056fa9071a5
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/UDSConnector.cpp
@@ -0,0 +1,144 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * UDSConnector.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/UDSConnector.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "UDSConnector.h"
+#include "Config.h"
+#include "GpscStat.h"
+#include "log/LogOps.h"
+#include "memory/gpdbwrappers.h"
+
+#include <string>
+#include <sys/fcntl.h>
+#include <sys/socket.h>
+#include <sys/types.h>
+#include <sys/un.h>
+#include <unistd.h>
+
+extern "C" {
+#include "postgres.h"
+}
+
+// Writes a LOG-level message saying that tracing of `event` failed for the
+// query identified by the request's key. The message ends with %m, i.e. the
+// text for the current errno, so call this right after the failing call.
+static inline void
+log_tracing_failure(const gpsc::SetQueryReq &req, const std::string &event)
+{
+	const auto &key = req.query_key();
+	ereport(LOG, (errmsg("Query {%d-%d-%d} %s tracing failed with error %m",
+						 key.tmid(), key.ssid(), key.ccnt(), event.c_str())));
+}
+
+// Serializes `req` and sends it over a fresh Unix domain stream socket
+// connected to config.uds_path().
+//
+// Wire format: a uint32_t holding the serialized size, followed by the
+// serialized message. The socket is non-blocking and every send uses
+// MSG_DONTWAIT; between partial sends the function sleeps for 1000
+// microseconds.
+//
+// Returns true when sending finished without a send error, false on any
+// failure. Each outcome is also reported to GpscStat. `event` is only used
+// in log messages.
+bool
+UDSConnector::report_query(const gpsc::SetQueryReq &req,
+						   const std::string &event, const Config &config)
+{
+	sockaddr_un address{};
+	address.sun_family = AF_UNIX;
+
+	// The path, including its terminating NUL, has to fit into sun_path.
+	const auto &uds_path = config.uds_path();
+	if (uds_path.size() >= sizeof(address.sun_path))
+	{
+		ereport(WARNING, (errmsg("UDS path is too long for socket buffer")));
+		GpscStat::report_error();
+		return false;
+	}
+	strcpy(address.sun_path, uds_path.c_str());
+
+	const auto sockfd = socket(AF_UNIX, SOCK_STREAM, 0);
+	if (sockfd == -1)
+	{
+		log_tracing_failure(req, event);
+		GpscStat::report_error();
+		return false;
+	}
+
+	// From here on the socket is closed on every way out of the function.
+	struct SocketCloser
+	{
+		int fd;
+		~SocketCloser()
+		{
+			close(fd);
+		}
+	} socket_closer{sockfd};
+
+	if (fcntl(sockfd, F_SETFL, O_NONBLOCK) == -1)
+	{
+		// This should never happen, so it is deliberately made visible to
+		// end users and admins.
+		ereport(WARNING,
+				(errmsg("Unable to create non-blocking socket connection %m")));
+		GpscStat::report_error();
+		return false;
+	}
+
+	if (connect(sockfd, reinterpret_cast<sockaddr *>(&address),
+				sizeof(address)) == -1)
+	{
+		log_tracing_failure(req, event);
+		GpscStat::report_bad_connection();
+		return false;
+	}
+
+	// Buffer layout: [uint32_t size][serialized message].
+	const auto data_size = req.ByteSizeLong();
+	const auto total_size = data_size + sizeof(uint32_t);
+	auto *buf = static_cast<uint8_t *>(gpdb::palloc(total_size));
+
+	// The buffer is released on every way out of the function.
+	struct BufferReleaser
+	{
+		void *p;
+		~BufferReleaser()
+		{
+			gpdb::pfree(p);
+		}
+	} buffer_releaser{buf};
+
+	*reinterpret_cast<uint32_t *>(buf) = data_size;
+	req.SerializeWithCachedSizesToArray(buf + sizeof(uint32_t));
+
+	int64_t sent = 0;
+	int64_t sent_total = 0;
+	for (;;)
+	{
+		sent = send(sockfd, buf + sent_total, total_size - sent_total,
+					MSG_DONTWAIT);
+		if (sent <= 0)
+			break;
+
+		sent_total += sent;
+		if (size_t(sent_total) == total_size)
+			break;
+
+		// Small throttling hack: when a message does not fit a single
+		// packet, take a nap before sending the next part. Otherwise a
+		// MSG_DONTWAIT send might overflow the UDS.
+		pg_usleep(1000);
+	}
+
+	if (sent < 0)
+	{
+		log_tracing_failure(req, event);
+		GpscStat::report_bad_send(total_size);
+		return false;
+	}
+
+	GpscStat::report_send(total_size);
+	return true;
+}
diff --git a/gpcontrib/gp_stats_collector/src/UDSConnector.h b/gpcontrib/gp_stats_collector/src/UDSConnector.h
new file mode 100644
index 00000000000..ac56dd54f44
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/UDSConnector.h
@@ -0,0 +1,42 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * UDSConnector.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/UDSConnector.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef UDSCONNECTOR_H
+#define UDSCONNECTOR_H
+
+#include "protos/gpsc_set_service.pb.h"
+
+class Config;
+
+/* Sends query reports over a Unix domain socket. Has no state of its own. */
+class UDSConnector
+{
+public:
+	/*
+	 * Sends `req` to the socket at config.uds_path(). `event` is used in
+	 * log messages only. Returns true on success, false on failure.
+	 */
+	static bool report_query(const gpsc::SetQueryReq &req,
+							 const std::string &event, const Config &config);
+};
+
+#endif /* UDSCONNECTOR_H */
diff --git a/gpcontrib/gp_stats_collector/src/gp_stats_collector.c b/gpcontrib/gp_stats_collector/src/gp_stats_collector.c
new file mode 100644
index 00000000000..d295e37b396
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/gp_stats_collector.c
@@ -0,0 +1,175 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * gp_stats_collector.c
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/gp_stats_collector.c
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "postgres.h"
+#include "cdb/cdbvars.h"
+#include "funcapi.h"
+#include "utils/builtins.h"
+
+#include "hook_wrappers.h"
+
+PG_MODULE_MAGIC;
+
+void _PG_init(void);
+void _PG_fini(void);
+PG_FUNCTION_INFO_V1(gpsc_stat_messages_reset);
+PG_FUNCTION_INFO_V1(gpsc_stat_messages);
+PG_FUNCTION_INFO_V1(gpsc_init_log);
+PG_FUNCTION_INFO_V1(gpsc_truncate_log);
+
+PG_FUNCTION_INFO_V1(gpsc_test_uds_start_server);
+PG_FUNCTION_INFO_V1(gpsc_test_uds_receive);
+PG_FUNCTION_INFO_V1(gpsc_test_uds_stop_server);
+
+/*
+ * Module load callback: installs the hooks, but only in a process whose role
+ * is dispatcher or executor.
+ */
+void
+_PG_init(void)
+{
+	switch (Gp_role)
+	{
+		case GP_ROLE_DISPATCH:
+		case GP_ROLE_EXECUTE:
+			hooks_init();
+			break;
+		default:
+			break;
+	}
+}
+
+/*
+ * Module unload callback: removes the hooks, but only in a process whose
+ * role is dispatcher or executor.
+ */
+void
+_PG_fini(void)
+{
+	switch (Gp_role)
+	{
+		case GP_ROLE_DISPATCH:
+		case GP_ROLE_EXECUTE:
+			hooks_deinit();
+			break;
+		default:
+			break;
+	}
+}
+
+/*
+ * SQL-callable set-returning function that calls gpsc_functions_reset() on
+ * its first call and returns an empty set.
+ */
+Datum
+gpsc_stat_messages_reset(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		/* The context is fetched again below; only the setup matters here. */
+		(void) SRF_FIRSTCALL_INIT();
+		gpsc_functions_reset();
+	}
+
+	/* No rows to return: finish the set right away. */
+	funcctx = SRF_PERCALL_SETUP();
+	SRF_RETURN_DONE(funcctx);
+}
+
+/*
+ * SQL-callable function; the whole call is forwarded to
+ * gpsc_functions_get(), whose result is returned as is.
+ */
+Datum
+gpsc_stat_messages(PG_FUNCTION_ARGS)
+{
+	Datum		result = gpsc_functions_get(fcinfo);
+
+	return result;
+}
+
+/*
+ * SQL-callable set-returning function that calls init_log() on its first
+ * call and returns an empty set.
+ */
+Datum
+gpsc_init_log(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		/* The context is fetched again below; only the setup matters here. */
+		(void) SRF_FIRSTCALL_INIT();
+		init_log();
+	}
+
+	/* No rows to return: finish the set right away. */
+	funcctx = SRF_PERCALL_SETUP();
+	SRF_RETURN_DONE(funcctx);
+}
+
+/*
+ * SQL-callable set-returning function that calls truncate_log() on its
+ * first call and returns an empty set.
+ */
+Datum
+gpsc_truncate_log(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		/* The context is fetched again below; only the setup matters here. */
+		(void) SRF_FIRSTCALL_INIT();
+		truncate_log();
+	}
+
+	/* No rows to return: finish the set right away. */
+	funcctx = SRF_PERCALL_SETUP();
+	SRF_RETURN_DONE(funcctx);
+}
+
+/*
+ * SQL-callable set-returning test helper: on its first call it passes the
+ * text argument, converted to a C string, to test_uds_start_server(). It
+ * returns an empty set.
+ */
+Datum
+gpsc_test_uds_start_server(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		char	   *socket_path;
+
+		/* The context is fetched again below; only the setup matters here. */
+		(void) SRF_FIRSTCALL_INIT();
+
+		/* The C string copy is only needed for the duration of the call. */
+		socket_path = text_to_cstring(PG_GETARG_TEXT_PP(0));
+		test_uds_start_server(socket_path);
+		pfree(socket_path);
+	}
+
+	/* No rows to return: finish the set right away. */
+	funcctx = SRF_PERCALL_SETUP();
+	SRF_RETURN_DONE(funcctx);
+}
+
+/*
+ * SQL-callable set-returning test helper: on its first call it runs
+ * test_uds_receive() with the int4 argument as timeout and keeps the result
+ * in multi-call memory. The set consists of exactly one int8 row holding
+ * that result.
+ */
+Datum
+gpsc_test_uds_receive(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		MemoryContext caller_cxt;
+		int64	   *slot;
+
+		funcctx = SRF_FIRSTCALL_INIT();
+
+		/* The result slot has to outlive this call, so allocate it here. */
+		caller_cxt = MemoryContextSwitchTo(funcctx->multi_call_memory_ctx);
+		slot = (int64 *) palloc(sizeof(int64));
+		funcctx->user_fctx = slot;
+		funcctx->max_calls = 1;
+		MemoryContextSwitchTo(caller_cxt);
+
+		*slot = test_uds_receive(PG_GETARG_INT32(0));
+	}
+
+	funcctx = SRF_PERCALL_SETUP();
+
+	/* The single row has already been handed out. */
+	if (funcctx->call_cntr >= funcctx->max_calls)
+		SRF_RETURN_DONE(funcctx);
+
+	SRF_RETURN_NEXT(funcctx, Int64GetDatum(*(int64 *) funcctx->user_fctx));
+}
+
+/*
+ * SQL-callable set-returning test helper that calls test_uds_stop_server()
+ * on its first call and returns an empty set.
+ */
+Datum
+gpsc_test_uds_stop_server(PG_FUNCTION_ARGS)
+{
+	FuncCallContext *funcctx;
+
+	if (SRF_IS_FIRSTCALL())
+	{
+		/* The context is fetched again below; only the setup matters here. */
+		(void) SRF_FIRSTCALL_INIT();
+		test_uds_stop_server();
+	}
+
+	/* No rows to return: finish the set right away. */
+	funcctx = SRF_PERCALL_SETUP();
+	SRF_RETURN_DONE(funcctx);
+}
diff --git a/gpcontrib/gp_stats_collector/src/hook_wrappers.cpp b/gpcontrib/gp_stats_collector/src/hook_wrappers.cpp
new file mode 100644
index 00000000000..38ea117bda2
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/hook_wrappers.cpp
@@ -0,0 +1,474 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * hook_wrappers.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/hook_wrappers.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#define typeid __typeid
+extern "C" {
+#include "postgres.h"
+#include "cdb/cdbvars.h"
+#include "cdb/ml_ipc.h"
+#include "executor/execUtils.h"
+#include "executor/executor.h"
+#include "funcapi.h"
+#include "stat_statements_parser/pg_stat_statements_parser.h"
+#include "tcop/utility.h"
+#include "utils/builtins.h"
+#include "utils/elog.h"
+#include "utils/metrics_utils.h"
+
+#include <errno.h>
+#include <poll.h>
+#include <sys/socket.h>
+#include <sys/un.h>
+#include <unistd.h>
+}
+#undef typeid
+
+#include "Config.h"
+#include "EventSender.h"
+#include "GpscStat.h"
+#include "hook_wrappers.h"
+#include "memory/gpdbwrappers.h"
+
+/*
+ * Hook values that were in place when hooks_init() ran. The gpsc hooks chain
+ * to them when they are non-null, and hooks_deinit() writes them back.
+ */
+static ExecutorStart_hook_type previous_ExecutorStart_hook = nullptr;
+static ExecutorRun_hook_type previous_ExecutorRun_hook = nullptr;
+static ExecutorFinish_hook_type previous_ExecutorFinish_hook = nullptr;
+static ExecutorEnd_hook_type previous_ExecutorEnd_hook = nullptr;
+static query_info_collect_hook_type previous_query_info_collect_hook = nullptr;
+/* Only present when the server build defines the corresponding hook macro. */
+#ifdef ANALYZE_STATS_COLLECT_HOOK
+static analyze_stats_collect_hook_type previous_analyze_stats_collect_hook =
+	nullptr;
+#endif
+#ifdef IC_TEARDOWN_HOOK
+static ic_teardown_hook_type previous_ic_teardown_hook = nullptr;
+#endif
+static ProcessUtility_hook_type previous_ProcessUtility_hook = nullptr;
+
+/*
+ * Forward declarations of the gpsc hook implementations that hooks_init()
+ * installs; the definitions follow further down in this file.
+ */
+static void gpsc_ExecutorStart_hook(QueryDesc *query_desc, int eflags);
+static void gpsc_ExecutorRun_hook(QueryDesc *query_desc,
+								  ScanDirection direction, uint64 count,
+								  bool execute_once);
+static void gpsc_ExecutorFinish_hook(QueryDesc *query_desc);
+static void gpsc_ExecutorEnd_hook(QueryDesc *query_desc);
+static void gpsc_query_info_collect_hook(QueryMetricsStatus status, void *arg);
+#ifdef IC_TEARDOWN_HOOK
+static void gpsc_ic_teardown_hook(ChunkTransportState *transportStates,
+								  bool hasErrors);
+#endif
+#ifdef ANALYZE_STATS_COLLECT_HOOK
+static void gpsc_analyze_stats_collect_hook(QueryDesc *query_desc);
+#endif
+static void gpsc_process_utility_hook(
+	PlannedStmt *pstmt, const char *queryString, bool readOnlyTree,
+	ProcessUtilityContext context, ParamListInfo params,
+	QueryEnvironment *queryEnv, DestReceiver *dest, QueryCompletion *qc);
+
+/* Backlog passed to listen() by the test Unix domain socket server. */
+#define TEST_MAX_CONNECTIONS 4
+/* Size of the stack buffer used by test_uds_receive() for each recv(). */
+#define TEST_RCV_BUF_SIZE 8192
+/* Upper bound, in milliseconds, for a single poll() in test_uds_receive(). */
+#define TEST_POLL_TIMEOUT_MS 200
+
+/* Listening socket of the test server; -1 while no server is running. */
+static int test_server_fd = -1;
+/* Socket path of the running test server (TopMemoryContext copy), or NULL. */
+static char *test_sock_path = NULL;
+
+/* Lazily created by get_sender(); destroyed by hooks_deinit(). */
+static EventSender *sender = nullptr;
+
+/*
+ * Return the file-level EventSender, constructing it on first use.
+ */
+static inline EventSender *
+get_sender()
+{
+	if (sender == nullptr)
+		sender = new EventSender();
+
+	return sender;
+}
+
+/*
+ * Invoke the member function func on obj with args and return its result.
+ *
+ * A std::exception thrown by the call is reported as a PostgreSQL ERROR whose
+ * message includes e.what(). Exceptions that do not derive from
+ * std::exception are not caught here and propagate to the caller.
+ */
+template <typename T, typename R, typename... Args>
+R
+cpp_call(T *obj, R (T::*func)(Args...), Args... args)
+{
+	try
+	{
+		return (obj->*func)(args...);
+	}
+	catch (const std::exception &e)
+	{
+		ereport(ERROR, (errmsg("Unexpected exception in gpsc %s", e.what())));
+		/* Control is not expected to get past ereport(ERROR); this also keeps
+		 * the non-void return path well-formed. */
+		pg_unreachable();
+	}
+}
+
+/*
+ * Register GUCs, initialise GpscStat and install all gpsc hooks.
+ *
+ * For every hook the current value is saved in the matching previous_* static
+ * first, so the gpsc hook can chain to it and hooks_deinit() can restore it.
+ */
+void
+hooks_init()
+{
+	Config::init_gucs();
+	GpscStat::init();
+	previous_ExecutorStart_hook = ExecutorStart_hook;
+	ExecutorStart_hook = gpsc_ExecutorStart_hook;
+	previous_ExecutorRun_hook = ExecutorRun_hook;
+	ExecutorRun_hook = gpsc_ExecutorRun_hook;
+	previous_ExecutorFinish_hook = ExecutorFinish_hook;
+	ExecutorFinish_hook = gpsc_ExecutorFinish_hook;
+	previous_ExecutorEnd_hook = ExecutorEnd_hook;
+	ExecutorEnd_hook = gpsc_ExecutorEnd_hook;
+	previous_query_info_collect_hook = query_info_collect_hook;
+	query_info_collect_hook = gpsc_query_info_collect_hook;
+	/* Optional hooks: only compiled in when the server provides them. */
+#ifdef IC_TEARDOWN_HOOK
+	previous_ic_teardown_hook = ic_teardown_hook;
+	ic_teardown_hook = gpsc_ic_teardown_hook;
+#endif
+#ifdef ANALYZE_STATS_COLLECT_HOOK
+	previous_analyze_stats_collect_hook = analyze_stats_collect_hook;
+	analyze_stats_collect_hook = gpsc_analyze_stats_collect_hook;
+#endif
+	/* NOTE(review): the parser is initialised before ProcessUtility_hook is
+	 * captured; confirm whether this ordering is required. */
+	stat_statements_parser_init();
+	previous_ProcessUtility_hook = ProcessUtility_hook;
+	ProcessUtility_hook = gpsc_process_utility_hook;
+}
+
+/*
+ * Undo hooks_init(): restore every saved hook value, shut down the statement
+ * parser, destroy the EventSender and deinitialise GpscStat.
+ */
+void
+hooks_deinit()
+{
+	ExecutorStart_hook = previous_ExecutorStart_hook;
+	ExecutorEnd_hook = previous_ExecutorEnd_hook;
+	ExecutorRun_hook = previous_ExecutorRun_hook;
+	ExecutorFinish_hook = previous_ExecutorFinish_hook;
+	query_info_collect_hook = previous_query_info_collect_hook;
+#ifdef IC_TEARDOWN_HOOK
+	ic_teardown_hook = previous_ic_teardown_hook;
+#endif
+#ifdef ANALYZE_STATS_COLLECT_HOOK
+	analyze_stats_collect_hook = previous_analyze_stats_collect_hook;
+#endif
+	stat_statements_parser_deinit();
+
+	/*
+	 * Destroy the sender and clear the pointer. Without the reset, a later
+	 * get_sender() call would see a non-null pointer and hand out freed
+	 * memory instead of constructing a new EventSender.
+	 */
+	delete sender;
+	sender = nullptr;
+
+	GpscStat::deinit();
+	ProcessUtility_hook = previous_ProcessUtility_hook;
+}
+
+/*
+ * ExecutorStart hook: notify the sender before and after the real executor
+ * start, which is either the previously installed hook or the standard one.
+ */
+void
+gpsc_ExecutorStart_hook(QueryDesc *query_desc, int eflags)
+{
+	cpp_call(get_sender(), &EventSender::executor_before_start, query_desc,
+			 eflags);
+
+	ExecutorStart_hook_type start_next = previous_ExecutorStart_hook
+											 ? previous_ExecutorStart_hook
+											 : standard_ExecutorStart;
+	start_next(query_desc, eflags);
+
+	cpp_call(get_sender(), &EventSender::executor_after_start, query_desc,
+			 eflags);
+}
+
+/*
+ * ExecutorRun hook: bump the sender's nesting depth around the real executor
+ * run and restore it on both the success and the error path.
+ */
+void
+gpsc_ExecutorRun_hook(QueryDesc *query_desc, ScanDirection direction,
+					  uint64 count, bool execute_once)
+{
+	get_sender()->incr_depth();
+	PG_TRY();
+	{
+		ExecutorRun_hook_type run_next = previous_ExecutorRun_hook
+											 ? previous_ExecutorRun_hook
+											 : standard_ExecutorRun;
+
+		run_next(query_desc, direction, count, execute_once);
+		get_sender()->decr_depth();
+	}
+	PG_CATCH();
+	{
+		/* Keep the depth balanced before handing the error on. */
+		get_sender()->decr_depth();
+		PG_RE_THROW();
+	}
+	PG_END_TRY();
+}
+
+/*
+ * ExecutorFinish hook: bump the sender's nesting depth around the real
+ * executor finish and restore it on both the success and the error path.
+ */
+void
+gpsc_ExecutorFinish_hook(QueryDesc *query_desc)
+{
+	get_sender()->incr_depth();
+	PG_TRY();
+	{
+		ExecutorFinish_hook_type finish_next =
+			previous_ExecutorFinish_hook ? previous_ExecutorFinish_hook
+										 : standard_ExecutorFinish;
+
+		finish_next(query_desc);
+		get_sender()->decr_depth();
+	}
+	PG_CATCH();
+	{
+		/* Keep the depth balanced before handing the error on. */
+		get_sender()->decr_depth();
+		PG_RE_THROW();
+	}
+	PG_END_TRY();
+}
+
+/*
+ * ExecutorEnd hook: let the sender observe the query first, then run the
+ * previously installed hook or, if there is none, the standard executor end.
+ */
+void
+gpsc_ExecutorEnd_hook(QueryDesc *query_desc)
+{
+	cpp_call(get_sender(), &EventSender::executor_end, query_desc);
+
+	ExecutorEnd_hook_type end_next = previous_ExecutorEnd_hook
+										 ? previous_ExecutorEnd_hook
+										 : standard_ExecutorEnd;
+	end_next(query_desc);
+}
+
+/*
+ * query_info_collect hook: forward the status to the sender as a non-utility
+ * event without error data, then chain to the previous hook if one exists.
+ */
+void
+gpsc_query_info_collect_hook(QueryMetricsStatus status, void *arg)
+{
+	cpp_call(get_sender(), &EventSender::query_metrics_collect, status,
+			 arg /* queryDesc */, false /* utility */, (ErrorData *) NULL);
+
+	if (previous_query_info_collect_hook == nullptr)
+		return;
+
+	previous_query_info_collect_hook(status, arg);
+}
+
+#ifdef IC_TEARDOWN_HOOK
+/*
+ * Interconnect teardown hook: ask the sender to collect interconnect metrics,
+ * then chain to the previous hook if one exists.
+ */
+void
+gpsc_ic_teardown_hook(ChunkTransportState *transportStates, bool hasErrors)
+{
+	cpp_call(get_sender(), &EventSender::ic_metrics_collect);
+
+	if (previous_ic_teardown_hook == nullptr)
+		return;
+
+	previous_ic_teardown_hook(transportStates, hasErrors);
+}
+#endif
+
+#ifdef ANALYZE_STATS_COLLECT_HOOK
+/*
+ * Analyze-stats hook: pass the query descriptor to the sender, then chain to
+ * the previous hook if one exists.
+ */
+void
+gpsc_analyze_stats_collect_hook(QueryDesc *query_desc)
+{
+	cpp_call(get_sender(), &EventSender::analyze_stats_collect, query_desc);
+
+	if (previous_analyze_stats_collect_hook == nullptr)
+		return;
+
+	previous_analyze_stats_collect_hook(query_desc);
+}
+#endif
+
+/*
+ * ProcessUtility hook: report utility statements to the sender.
+ *
+ * A zeroed QueryDesc carrying only the statement text is used as the event
+ * payload. SUBMIT is reported before the statement runs, DONE after it
+ * succeeds, and ERROR (with a copy of the error data) if it fails; the
+ * original error is then re-thrown. The sender's nesting depth is raised
+ * while the statement itself executes.
+ */
+static void
+gpsc_process_utility_hook(PlannedStmt *pstmt, const char *queryString,
+						  bool readOnlyTree, ProcessUtilityContext context,
+						  ParamListInfo params, QueryEnvironment *queryEnv,
+						  DestReceiver *dest, QueryCompletion *qc)
+{
+	/*
+	 * Tracks whether the depth raised below has already been lowered again.
+	 * Written inside PG_TRY and read in PG_CATCH, hence volatile. Without it,
+	 * an ERROR raised by the DONE report (which runs after decr_depth) would
+	 * make the catch block decrement the depth a second time.
+	 */
+	volatile bool depth_restored = false;
+
+	/* Project utility data on QueryDesc to use existing logic */
+	QueryDesc *query_desc = (QueryDesc *) palloc0(sizeof(QueryDesc));
+	query_desc->sourceText = queryString;
+
+	cpp_call(get_sender(), &EventSender::query_metrics_collect,
+			 METRICS_QUERY_SUBMIT, (void *) query_desc, true /* utility */,
+			 (ErrorData *) NULL);
+
+	get_sender()->incr_depth();
+	PG_TRY();
+	{
+		if (previous_ProcessUtility_hook)
+		{
+			(*previous_ProcessUtility_hook)(pstmt, queryString, readOnlyTree,
+											context, params, queryEnv, dest,
+											qc);
+		}
+		else
+		{
+			standard_ProcessUtility(pstmt, queryString, readOnlyTree, context,
+									params, queryEnv, dest, qc);
+		}
+
+		get_sender()->decr_depth();
+		depth_restored = true;
+		cpp_call(get_sender(), &EventSender::query_metrics_collect,
+				 METRICS_QUERY_DONE, (void *) query_desc, true /* utility */,
+				 (ErrorData *) NULL);
+
+		pfree(query_desc);
+	}
+	PG_CATCH();
+	{
+		ErrorData *edata;
+		MemoryContext oldctx;
+
+		/*
+		 * Take a private copy of the error and clear the error state so the
+		 * sender can run normally while reporting it.
+		 * NOTE(review): the copy lives in TopMemoryContext and is never freed
+		 * here; confirm whether ReThrowError() leaves it allocated.
+		 */
+		oldctx = MemoryContextSwitchTo(TopMemoryContext);
+		edata = CopyErrorData();
+		FlushErrorState();
+		MemoryContextSwitchTo(oldctx);
+
+		/* Lower the depth only if the try block did not get that far. */
+		if (!depth_restored)
+			get_sender()->decr_depth();
+		cpp_call(get_sender(), &EventSender::query_metrics_collect,
+				 METRICS_QUERY_ERROR, (void *) query_desc, true /* utility */,
+				 edata);
+
+		pfree(query_desc);
+		ReThrowError(edata);
+	}
+	PG_END_TRY();
+}
+
+/*
+ * Raise an ERROR unless GpscStat reports that it has been loaded.
+ */
+static void
+check_stats_loaded()
+{
+	if (GpscStat::loaded())
+		return;
+
+	ereport(ERROR, (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+					errmsg("gp_stats_collector must be loaded via "
+						   "shared_preload_libraries")));
+}
+
+/*
+ * Reset the GpscStat counters. Raises an ERROR (via check_stats_loaded) when
+ * GpscStat has not been loaded.
+ */
+void
+gpsc_functions_reset()
+{
+	check_stats_loaded();
+	GpscStat::reset();
+}
+
+/*
+ * Build a one-row composite Datum with this segment's index and the current
+ * GpscStat counters. Raises an ERROR (via check_stats_loaded) when GpscStat
+ * has not been loaded.
+ */
+Datum
+gpsc_functions_get(FunctionCallInfo fcinfo)
+{
+	const int ATTNUM = 6;
+
+	/* Result columns in attribute order: name and type of each one. */
+	const struct
+	{
+		const char *name;
+		Oid type;
+	} columns[ATTNUM] = {
+		{"segid", INT4OID},
+		{"total_messages", INT8OID},
+		{"send_failures", INT8OID},
+		{"connection_failures", INT8OID},
+		{"other_errors", INT8OID},
+		{"max_message_size", INT4OID},
+	};
+
+	check_stats_loaded();
+	auto stats = GpscStat::get_stats();
+
+	/* Describe the row type and register it. */
+	TupleDesc tupdesc = CreateTemplateTupleDesc(ATTNUM);
+	for (int col = 0; col < ATTNUM; ++col)
+	{
+		TupleDescInitEntry(tupdesc, (AttrNumber) (col + 1), columns[col].name,
+						   columns[col].type, -1 /* typmod */, 0 /* attdim */);
+	}
+	tupdesc = BlessTupleDesc(tupdesc);
+
+	/* No column is ever NULL. */
+	bool nulls[ATTNUM];
+	MemSet(nulls, 0, sizeof(nulls));
+
+	Datum values[ATTNUM];
+	values[0] = Int32GetDatum(GpIdentity.segindex);
+	values[1] = Int64GetDatum(stats.total);
+	values[2] = Int64GetDatum(stats.failed_sends);
+	values[3] = Int64GetDatum(stats.failed_connects);
+	values[4] = Int64GetDatum(stats.failed_other);
+	values[5] = Int32GetDatum(stats.max_message_size);
+
+	HeapTuple tuple = gpdb::heap_form_tuple(tupdesc, values, nulls);
+	PG_RETURN_DATUM(HeapTupleGetDatum(tuple));
+}
+
+/*
+ * Stop the test server: close the listening socket if it is open, then remove
+ * the socket file and release the stored path. Does nothing for parts that
+ * are already cleared.
+ */
+void
+test_uds_stop_server()
+{
+	if (test_server_fd >= 0)
+	{
+		close(test_server_fd);
+		test_server_fd = -1;
+	}
+
+	if (test_sock_path == NULL)
+		return;
+
+	unlink(test_sock_path);
+	pfree(test_sock_path);
+	test_sock_path = NULL;
+}
+
+/*
+ * Start the test Unix domain socket server listening on path.
+ *
+ * Any server that is already running is stopped first, and a stale socket
+ * file at path is removed. Raises an ERROR if path does not fit into
+ * sockaddr_un.sun_path or if socket(), bind() or listen() fails; in the
+ * latter case the partially created server is torn down again.
+ */
+void
+test_uds_start_server(const char *path)
+{
+	struct sockaddr_un addr = {.sun_family = AF_UNIX};
+
+	if (strlen(path) >= sizeof(addr.sun_path))
+		ereport(ERROR, (errmsg("path too long")));
+
+	test_uds_stop_server();
+
+	strlcpy(addr.sun_path, path, sizeof(addr.sun_path));
+	/* The path must outlive this call so stop_server can unlink it later. */
+	test_sock_path = MemoryContextStrdup(TopMemoryContext, path);
+	unlink(path);
+
+	if ((test_server_fd = socket(AF_UNIX, SOCK_STREAM, 0)) < 0 ||
+		bind(test_server_fd, (struct sockaddr *) &addr, sizeof(addr)) < 0 ||
+		listen(test_server_fd, TEST_MAX_CONNECTIONS) < 0)
+	{
+		/*
+		 * The cleanup below calls close() and unlink(), either of which may
+		 * overwrite errno. Preserve the original failure code so that %m
+		 * reports why the socket setup failed.
+		 */
+		int save_errno = errno;
+
+		test_uds_stop_server();
+		errno = save_errno;
+		ereport(ERROR, (errmsg("socket setup failed: %m")));
+	}
+}
+
+/*
+ * Wait for one client on the test server socket and count what it sends.
+ *
+ * Polls the listening socket until it becomes ready or the timeout_ms budget
+ * is used up. When the socket is readable, one connection is accepted and
+ * read until recv() returns 0 or fails with an error other than EINTR.
+ *
+ * Returns the number of bytes received; 0 if the wait timed out or poll()
+ * reported something other than POLLIN. Raises an ERROR if the server is not
+ * running or if poll()/accept() fails.
+ */
+int64
+test_uds_receive(int timeout_ms)
+{
+	char buf[TEST_RCV_BUF_SIZE];
+	int rc;
+	struct pollfd pfd = {.fd = test_server_fd, .events = POLLIN};
+	int64 total = 0;
+
+	if (test_server_fd < 0)
+		ereport(ERROR, (errmsg("server not started")));
+
+	/*
+	 * Wait in slices of at most TEST_POLL_TIMEOUT_MS so that
+	 * CHECK_FOR_INTERRUPTS() runs between slices.
+	 * NOTE(review): a negative timeout_ms is handed to poll() unchanged;
+	 * confirm callers never pass one.
+	 */
+	for (;;)
+	{
+		CHECK_FOR_INTERRUPTS();
+		rc = poll(&pfd, 1, Min(timeout_ms, TEST_POLL_TIMEOUT_MS));
+		if (rc > 0)
+			break;
+		if (rc < 0 && errno != EINTR)
+			ereport(ERROR, (errmsg("poll: %m")));
+		/* A full slice is charged even when poll() was cut short by EINTR. */
+		timeout_ms -= TEST_POLL_TIMEOUT_MS;
+		if (timeout_ms <= 0)
+			return total;
+	}
+
+	if (pfd.revents & POLLIN)
+	{
+		int client = accept(test_server_fd, NULL, NULL);
+		ssize_t n;
+
+		if (client < 0)
+			ereport(ERROR, (errmsg("accept: %m")));
+
+		/*
+		 * Drain the connection: stop when recv() returns 0, retry on EINTR,
+		 * give up on any other error.
+		 * NOTE(review): this loop has no CHECK_FOR_INTERRUPTS(), so a client
+		 * that stays connected without sending keeps the backend here.
+		 */
+		while ((n = recv(client, buf, sizeof(buf), 0)) != 0)
+		{
+			if (n > 0)
+				total += n;
+			else if (errno != EINTR)
+				break;
+		}
+
+		close(client);
+	}
+
+	return total;
+}
\ No newline at end of file
diff --git a/gpcontrib/gp_stats_collector/src/hook_wrappers.h b/gpcontrib/gp_stats_collector/src/hook_wrappers.h
new file mode 100644
index 00000000000..a04f5a95144
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/hook_wrappers.h
@@ -0,0 +1,50 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * hook_wrappers.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/hook_wrappers.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef HOOK_WRAPPERS_H
+#define HOOK_WRAPPERS_H
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+/*
+ * These prototypes use PostgreSQL types (Datum, FunctionCallInfo, int64), so
+ * postgres.h and fmgr.h must be included before this header.
+ */
+
+/* Hook installation / removal. */
+extern void hooks_init();
+extern void hooks_deinit();
+
+/* Statistics accessors backing the SQL-level functions. */
+extern void gpsc_functions_reset();
+extern Datum gpsc_functions_get(FunctionCallInfo fcinfo);
+
+/* Log table management. */
+extern void init_log();
+extern void truncate_log();
+
+/*
+ * Test-only Unix domain socket server. test_uds_receive() is declared with
+ * PostgreSQL's int64, the same type its definition uses: int64 and int64_t
+ * are not guaranteed to be the same underlying type on every platform, and a
+ * mismatch makes the declaration conflict with the definition.
+ */
+extern void test_uds_start_server(const char *path);
+extern int64 test_uds_receive(int timeout_ms);
+extern void test_uds_stop_server();
+
+#ifdef __cplusplus
+}
+#endif
+#endif /* HOOK_WRAPPERS_H */
diff --git a/gpcontrib/gp_stats_collector/src/log/LogOps.cpp b/gpcontrib/gp_stats_collector/src/log/LogOps.cpp
new file mode 100644
index 00000000000..865e0f6ce3f
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/log/LogOps.cpp
@@ -0,0 +1,173 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * LogOps.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/log/LogOps.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "protos/gpsc_set_service.pb.h"
+
+#include "LogOps.h"
+#include "LogSchema.h"
+
+extern "C" {
+#include "postgres.h"
+
+#include "access/heapam.h"
+#include "access/htup_details.h"
+#include "access/xact.h"
+#include "catalog/dependency.h"
+#include "catalog/heap.h"
+#include "catalog/namespace.h"
+#include "catalog/pg_namespace.h"
+#include "catalog/pg_type.h"
+#include "cdb/cdbvars.h"
+#include "commands/tablecmds.h"
+#include "fmgr.h"
+#include "funcapi.h"
+#include "utils/builtins.h"
+#include "utils/lsyscache.h"
+#include "utils/rel.h"
+#include "utils/snapmgr.h"
+#include "utils/timestamp.h"
+}
+
+/*
+ * Create the log table (log_relname) inside the extension schema
+ * (schema_name) and record a dependency of the table on that schema.
+ *
+ * Raises an ERROR if the schema does not exist, since the namespace lookup is
+ * done with missing_ok = false. The table is owned by the current user.
+ */
+void
+init_log()
+{
+	Oid namespaceId;
+	Oid relationId;
+	ObjectAddress tableAddr;
+	ObjectAddress schemaAddr;
+
+	namespaceId = get_namespace_oid(schema_name.data(), false /* missing_ok */);
+
+	/* Create table */
+	relationId = heap_create_with_catalog(
+		log_relname.data() /* relname */, namespaceId /* namespace */,
+		0 /* tablespace */, InvalidOid /* relid */,
+		InvalidOid /* reltype oid */, InvalidOid /* reloftypeid */,
+		GetUserId() /* owner */, HEAP_TABLE_AM_OID,
+		DescribeTuple() /* rel tuple */, NIL /* cooked_constraints */,
+		RELKIND_RELATION, RELPERSISTENCE_PERMANENT, false /* shared_relation */,
+		false /* mapped_relation */, ONCOMMIT_NOOP, NULL /* GP Policy */,
+		(Datum) 0 /* reloptions */, false /* use_user_acl */,
+		true /* allow_system_table_mods */, true /* is_internal */,
+		InvalidOid /* relrewrite */, NULL /* typaddress */,
+		false /* valid_opts */);
+
+	/* Make the table visible */
+	CommandCounterIncrement();
+
+	/* Record dependency of the table on the schema */
+	if (OidIsValid(relationId) && OidIsValid(namespaceId))
+	{
+		ObjectAddressSet(tableAddr, RelationRelationId, relationId);
+		ObjectAddressSet(schemaAddr, NamespaceRelationId, namespaceId);
+
+		/* Table can be dropped only via DROP EXTENSION */
+		recordDependencyOn(&tableAddr, &schemaAddr, DEPENDENCY_EXTENSION);
+	}
+	else
+	{
+		/* Only a NOTICE: a missing table or schema does not abort here. */
+		ereport(NOTICE, (errmsg("GPSC failed to create log table or schema")));
+	}
+
+	/* Make changes visible */
+	CommandCounterIncrement();
+}
+
+/*
+ * Append one row built from req to the log table.
+ *
+ * req     - protobuf request whose fields are mapped to log columns
+ * utility - value stored in the "utility" column of the row
+ *
+ * Returns without doing anything when called outside a transaction, when the
+ * extension schema does not exist, or when the log table has not been
+ * created yet.
+ */
+void
+insert_log(const gpsc::SetQueryReq &req, bool utility)
+{
+	Oid namespaceId;
+	Oid relationId;
+	Relation rel;
+	HeapTuple tuple;
+
+	/* Return if xact is not valid (needed for catalog lookups). */
+	if (!IsTransactionState())
+	{
+		return;
+	}
+
+	/* Return if extension was not loaded */
+	namespaceId = get_namespace_oid(schema_name.data(), true /* missing_ok */);
+	if (!OidIsValid(namespaceId))
+	{
+		return;
+	}
+
+	/* Return if the table was not created yet */
+	relationId = get_relname_relid(log_relname.data(), namespaceId);
+	if (!OidIsValid(relationId))
+	{
+		return;
+	}
+
+	bool nulls[natts_gpsc_log];
+	Datum values[natts_gpsc_log];
+
+	/* Every column starts out NULL; extraction clears the flag per field. */
+	memset(nulls, true, sizeof(nulls));
+	memset(values, 0, sizeof(values));
+
+	extract_query_req(req, "", values, nulls);
+	/* The utility flag is not part of req, so it is filled in here. */
+	nulls[attnum_gpsc_log_utility] = false;
+	values[attnum_gpsc_log_utility] = BoolGetDatum(utility);
+
+	rel = heap_open(relationId, RowExclusiveLock);
+
+	/*
+	 * Insert the tuple as a frozen one to ensure it is logged even if txn
+	 * rolls back or aborts.
+	 */
+	tuple = heap_form_tuple(RelationGetDescr(rel), values, nulls);
+	frozen_heap_insert(rel, tuple);
+
+	heap_freetuple(tuple);
+	/* Keep lock on rel until end of xact */
+	heap_close(rel, NoLock);
+
+	/* Make changes visible */
+	CommandCounterIncrement();
+}
+
+/*
+ * Remove all rows from the log table. Raises an ERROR if the extension
+ * schema does not exist (namespace lookup uses missing_ok = false).
+ */
+void
+truncate_log()
+{
+	const Oid schema_oid =
+		get_namespace_oid(schema_name.data(), false /* missing_ok */);
+	const Oid log_oid = get_relname_relid(log_relname.data(), schema_oid);
+
+	/* Exclusive access is taken for the duration of the truncation. */
+	Relation log_rel = heap_open(log_oid, AccessExclusiveLock);
+
+	heap_truncate_one_rel(log_rel);
+
+	/* Close without unlocking: the lock is kept until end of xact. */
+	heap_close(log_rel, NoLock);
+
+	/* Expose the truncation to later commands in this transaction. */
+	CommandCounterIncrement();
+}
\ No newline at end of file
diff --git a/gpcontrib/gp_stats_collector/src/log/LogOps.h b/gpcontrib/gp_stats_collector/src/log/LogOps.h
new file mode 100644
index 00000000000..45d79cd4560
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/log/LogOps.h
@@ -0,0 +1,49 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * LogOps.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/log/LogOps.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef LOGOPS_H
+#define LOGOPS_H
+
+#include <string>
+
+extern "C" {
+#include "postgres.h"
+#include "fmgr.h"
+}
+
+/*
+ * Forward declaration of the protobuf request type so that this header does
+ * not depend on the generated protobuf header being included first.
+ */
+namespace gpsc
+{
+class SetQueryReq;
+}  // namespace gpsc
+
+extern "C" {
+/* CREATE TABLE gpsc.__log (...); */
+void init_log();
+
+/* TRUNCATE gpsc.__log */
+void truncate_log();
+}
+
+/*
+ * INSERT INTO gpsc.__log VALUES (...)
+ *
+ * req supplies the column values; utility is stored in the "utility" column.
+ */
+void insert_log(const gpsc::SetQueryReq &req, bool utility);
+
+#endif /* LOGOPS_H */
diff --git a/gpcontrib/gp_stats_collector/src/log/LogSchema.cpp b/gpcontrib/gp_stats_collector/src/log/LogSchema.cpp
new file mode 100644
index 00000000000..254b1b04af4
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/log/LogSchema.cpp
@@ -0,0 +1,189 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * LogSchema.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/log/LogSchema.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "google/protobuf/descriptor.h"
+#include "google/protobuf/reflection.h"
+#include "google/protobuf/timestamp.pb.h"
+
+#include "LogSchema.h"
+
+/*
+ * Return the lookup table from protobuf field name to zero-based log column
+ * index. The table is built from log_tbl_desc on first use and then reused.
+ */
+const std::unordered_map<std::string_view, size_t> &
+proto_name_to_col_idx()
+{
+	static const std::unordered_map<std::string_view, size_t> index_by_name =
+		[] {
+			std::unordered_map<std::string_view, size_t> lookup;
+			lookup.reserve(log_tbl_desc.size());
+
+			size_t col = 0;
+			while (col < natts_gpsc_log)
+			{
+				lookup.emplace(log_tbl_desc[col].proto_field_name, col);
+				++col;
+			}
+
+			return lookup;
+		}();
+
+	return index_by_name;
+}
+
+/*
+ * Build a tuple descriptor for the log table: one attribute per log_tbl_desc
+ * entry, using its PostgreSQL column name and type OID.
+ */
+TupleDesc
+DescribeTuple()
+{
+	TupleDesc log_desc = CreateTemplateTupleDesc(natts_gpsc_log);
+
+	for (size_t col = 0; col < natts_gpsc_log; ++col)
+	{
+		const auto &column = log_tbl_desc[col];
+
+		/* Attribute numbers are one-based, array indexes zero-based. */
+		TupleDescInitEntry(log_desc, col + 1, column.pg_att_name.data(),
+						   column.type_oid, -1 /* typmod */, 0 /* attdim */);
+	}
+
+	return log_desc;
+}
+
+/*
+ * Convert a protobuf Timestamp (seconds and nanoseconds since the Unix epoch)
+ * to a TimestampTz Datum (microseconds since the PostgreSQL epoch).
+ * Sub-microsecond precision is dropped by the integer division.
+ */
+Datum
+protots_to_timestamptz(const google::protobuf::Timestamp &ts)
+{
+	/* Microseconds since the Unix epoch. */
+	const TimestampTz unix_usecs =
+		(TimestampTz) ts.seconds() * USECS_PER_SEC + (ts.nanos() / 1000);
+
+	/* Distance between the Unix and PostgreSQL epochs, in microseconds. */
+	const TimestampTz epoch_shift =
+		(POSTGRES_EPOCH_JDATE - UNIX_EPOCH_JDATE) * USECS_PER_DAY;
+
+	return TimestampTzGetDatum(unix_usecs - epoch_shift);
+}
+
+/*
+ * Convert the value of a singular, non-message protobuf field to a Datum.
+ *
+ * field      - descriptor of the field to read
+ * reflection - reflection interface of msg
+ * msg        - message that holds the field
+ *
+ * Returns a Datum chosen by the field's C++ type; field types not listed in
+ * the switch (e.g. messages) yield a zero Datum.
+ */
+Datum
+field_to_datum(const google::protobuf::FieldDescriptor *field,
+			   const google::protobuf::Reflection *reflection,
+			   const google::protobuf::Message &msg)
+{
+	using namespace google::protobuf;
+
+	switch (field->cpp_type())
+	{
+		case FieldDescriptor::CPPTYPE_INT32:
+			return Int32GetDatum(reflection->GetInt32(msg, field));
+		case FieldDescriptor::CPPTYPE_INT64:
+			return Int64GetDatum(reflection->GetInt64(msg, field));
+		/* Unsigned 32-bit values are stored as 64-bit integers. */
+		case FieldDescriptor::CPPTYPE_UINT32:
+			return Int64GetDatum(reflection->GetUInt32(msg, field));
+		/* Unsigned 64-bit values are reinterpreted as signed 64-bit. */
+		case FieldDescriptor::CPPTYPE_UINT64:
+			return Int64GetDatum(
+				static_cast<int64_t>(reflection->GetUInt64(msg, field)));
+		case FieldDescriptor::CPPTYPE_DOUBLE:
+			return Float8GetDatum(reflection->GetDouble(msg, field));
+		case FieldDescriptor::CPPTYPE_FLOAT:
+			return Float4GetDatum(reflection->GetFloat(msg, field));
+		case FieldDescriptor::CPPTYPE_BOOL:
+			return BoolGetDatum(reflection->GetBool(msg, field));
+		/* Enums are stored as text, using the enum value's name. */
+		case FieldDescriptor::CPPTYPE_ENUM:
+			return CStringGetTextDatum(
+				reflection->GetEnum(msg, field)->name().data());
+		case FieldDescriptor::CPPTYPE_STRING:
+			return CStringGetTextDatum(
+				reflection->GetString(msg, field).c_str());
+		default:
+			return (Datum) 0;
+	}
+}
+
+/*
+ * Store one protobuf field into the values/nulls arrays of a log row.
+ *
+ * field      - descriptor of the field to read
+ * reflection - reflection interface of msg
+ * msg        - message that holds the field
+ * field_name - dotted name used to look up the target log column
+ * values     - output Datum array, indexed by log column
+ * nulls      - output NULL-flag array, indexed by log column
+ *
+ * A field without a registered log column only produces a NOTICE. A field
+ * that is not set in msg marks its column NULL. google.protobuf.Timestamp
+ * fields are converted to timestamptz; all other fields go through
+ * field_to_datum().
+ */
+void
+process_field(const google::protobuf::FieldDescriptor *field,
+			  const google::protobuf::Reflection *reflection,
+			  const google::protobuf::Message &msg,
+			  const std::string &field_name, Datum *values, bool *nulls)
+{
+	/*
+	 * Bind by reference: a plain "auto" would copy the whole lookup table
+	 * for every processed field.
+	 */
+	const auto &proto_idx_map = proto_name_to_col_idx();
+	const auto it = proto_idx_map.find(field_name);
+
+	if (it == proto_idx_map.end())
+	{
+		ereport(NOTICE,
+				(errmsg("GPSC protobuf field %s is not registered in log table",
+						field_name.c_str())));
+		return;
+	}
+
+	const size_t idx = it->second;
+
+	if (!reflection->HasField(msg, field))
+	{
+		nulls[idx] = true;
+		return;
+	}
+
+	if (field->cpp_type() ==
+			google::protobuf::FieldDescriptor::CPPTYPE_MESSAGE &&
+		field->message_type()->full_name() == "google.protobuf.Timestamp")
+	{
+		const auto &ts = static_cast<const google::protobuf::Timestamp &>(
+			reflection->GetMessage(msg, field));
+		values[idx] = protots_to_timestamptz(ts);
+	}
+	else
+	{
+		values[idx] = field_to_datum(field, reflection, msg);
+	}
+	nulls[idx] = false;
+}
+
+/*
+ * Walk all fields of msg and fill values/nulls for the matching log columns.
+ *
+ * msg    - message to flatten
+ * prefix - dotted path of msg inside the top-level request ("" at the top)
+ * values - output Datum array, indexed by log column
+ * nulls  - output NULL-flag array, indexed by log column
+ *
+ * Repeated fields are skipped. Nested messages other than
+ * google.protobuf.Timestamp are descended into when they are set; every other
+ * field is handed to process_field() under its dotted name.
+ */
+void
+extract_query_req(const google::protobuf::Message &msg,
+				  const std::string &prefix, Datum *values, bool *nulls)
+{
+	using namespace google::protobuf;
+
+	const Descriptor *msg_desc = msg.GetDescriptor();
+	const Reflection *msg_refl = msg.GetReflection();
+
+	/* The path prefix is the same for every field of this message. */
+	const std::string curr_pref = prefix.empty() ? "" : prefix + ".";
+
+	for (int i = 0; i < msg_desc->field_count(); ++i)
+	{
+		const FieldDescriptor *field = msg_desc->field(i);
+
+		// For now, we do not log any repeated fields plus they need special
+		// treatment.
+		if (field->is_repeated())
+			continue;
+
+		const std::string field_name = curr_pref + field->name().data();
+
+		const bool is_nested_message =
+			field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE &&
+			field->message_type()->full_name() != "google.protobuf.Timestamp";
+
+		if (!is_nested_message)
+		{
+			process_field(field, msg_refl, msg, field_name, values, nulls);
+			continue;
+		}
+
+		// Unset nested messages contribute nothing.
+		if (msg_refl->HasField(msg, field))
+		{
+			const Message &nested = msg_refl->GetMessage(msg, field);
+			extract_query_req(nested, field_name, values, nulls);
+		}
+	}
+}
diff --git a/gpcontrib/gp_stats_collector/src/log/LogSchema.h b/gpcontrib/gp_stats_collector/src/log/LogSchema.h
new file mode 100644
index 00000000000..f6c2247370a
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/log/LogSchema.h
@@ -0,0 +1,199 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * LogSchema.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/log/LogSchema.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef LOGSCHEMA_H
+#define LOGSCHEMA_H
+
+#include <array>
+#include <string>
+#include <string_view>
+#include <unordered_map>
+
+extern "C" {
+#include "postgres.h"
+#include "access/htup_details.h"
+#include "access/tupdesc.h"
+#include "catalog/pg_type.h"
+#include "utils/builtins.h"
+#include "utils/timestamp.h"
+}
+
+namespace google
+{
+namespace protobuf
+{
+class FieldDescriptor;
+class Message;
+class Reflection;
+class Timestamp;
+}  // namespace protobuf
+}  // namespace google
+
+inline constexpr std::string_view schema_name = "gpsc"; /* NOTE(review): presumably the schema that holds the log relation -- confirm at the use site */
+inline constexpr std::string_view log_relname = "__log"; /* NOTE(review): presumably the name of the log relation -- confirm at the use site */
+
+struct LogDesc /* describes one entry (column) of log_tbl_desc */
+{
+	std::string_view pg_att_name; /* column name in the log table */
+	std::string_view proto_field_name; /* dotted path of the source protobuf field; "" when there is none */
+	Oid type_oid; /* type OID of the column, e.g. INT8OID or TEXTOID */
+};
+
+/*
+ * Definition of the log table structure.
+ *
+ * Each entry pairs one log table column (pg_att_name, type_oid) with the
+ * dotted path of the protobuf field it is filled from (proto_field_name).
+ * Entries are grouped by type: 8-byte types first, then 4-byte types, then
+ * variable-length text.
+ *
+ * The last entry, "utility", has no protobuf source (its proto_field_name
+ * is empty).  It must stay last, because attnum_gpsc_log_utility is
+ * derived as natts_gpsc_log - 1.
+ *
+ * System stats collected as %lu (unsigned) may
+ * overflow INT8OID (signed), but this is acceptable.
+ */
+/* clang-format off */
+inline constexpr std::array log_tbl_desc = {  
+ /* 8-byte aligned types first - Query Info */  
+ LogDesc{"query_id",             "query_info.query_id",   INT8OID},  
+ LogDesc{"plan_id",              "query_info.plan_id",    INT8OID},  
+ LogDesc{"nested_level",         "add_info.nested_level", INT8OID},  
+ LogDesc{"slice_id",             "add_info.slice_id",     INT8OID},  
+ /* 8-byte aligned types - System Stats */  
+ LogDesc{"systemstat_vsize",                  "query_metrics.systemStat.vsize",                 INT8OID},  
+ LogDesc{"systemstat_rss",                    "query_metrics.systemStat.rss",                   INT8OID},  
+ LogDesc{"systemstat_vmsizekb",               "query_metrics.systemStat.VmSizeKb",              INT8OID},  
+ LogDesc{"systemstat_vmpeakkb",               "query_metrics.systemStat.VmPeakKb",              INT8OID},  
+ LogDesc{"systemstat_rchar",                  "query_metrics.systemStat.rchar",                 INT8OID},  
+ LogDesc{"systemstat_wchar",                  "query_metrics.systemStat.wchar",                 INT8OID},  
+ LogDesc{"systemstat_syscr",                  "query_metrics.systemStat.syscr",                 INT8OID},  
+ LogDesc{"systemstat_syscw",                  "query_metrics.systemStat.syscw",                 INT8OID},  
+ LogDesc{"systemstat_read_bytes",             "query_metrics.systemStat.read_bytes",            INT8OID},  
+ LogDesc{"systemstat_write_bytes",            "query_metrics.systemStat.write_bytes",           INT8OID},  
+ LogDesc{"systemstat_cancelled_write_bytes",  "query_metrics.systemStat.cancelled_write_bytes", INT8OID},  
+ /* 8-byte aligned types - Metric Instrumentation */  
+ LogDesc{"instrumentation_ntuples",                  "query_metrics.instrumentation.ntuples",             INT8OID},  
+ LogDesc{"instrumentation_nloops",                   "query_metrics.instrumentation.nloops",              INT8OID},  
+ LogDesc{"instrumentation_tuplecount",               "query_metrics.instrumentation.tuplecount",          INT8OID},  
+ LogDesc{"instrumentation_shared_blks_hit",          "query_metrics.instrumentation.shared_blks_hit",     INT8OID},  
+ LogDesc{"instrumentation_shared_blks_read",         "query_metrics.instrumentation.shared_blks_read",    INT8OID},  
+ LogDesc{"instrumentation_shared_blks_dirtied",      "query_metrics.instrumentation.shared_blks_dirtied", INT8OID},  
+ LogDesc{"instrumentation_shared_blks_written",      "query_metrics.instrumentation.shared_blks_written", INT8OID},  
+ LogDesc{"instrumentation_local_blks_hit",           "query_metrics.instrumentation.local_blks_hit",      INT8OID},  
+ LogDesc{"instrumentation_local_blks_read",          "query_metrics.instrumentation.local_blks_read",     INT8OID},  
+ LogDesc{"instrumentation_local_blks_dirtied",       "query_metrics.instrumentation.local_blks_dirtied",  INT8OID},  
+ LogDesc{"instrumentation_local_blks_written",       "query_metrics.instrumentation.local_blks_written",  INT8OID},  
+ LogDesc{"instrumentation_temp_blks_read",           "query_metrics.instrumentation.temp_blks_read",      INT8OID},  
+ LogDesc{"instrumentation_temp_blks_written",        "query_metrics.instrumentation.temp_blks_written",   INT8OID},  
+ LogDesc{"instrumentation_inherited_calls",          "query_metrics.instrumentation.inherited_calls",     INT8OID},  
+ /* 8-byte aligned types - Network Stats */  
+ LogDesc{"instrumentation_sent_total_bytes",         "query_metrics.instrumentation.sent.total_bytes",     INT8OID},  
+ LogDesc{"instrumentation_sent_tuple_bytes",         "query_metrics.instrumentation.sent.tuple_bytes",     INT8OID},  
+ LogDesc{"instrumentation_sent_chunks",              "query_metrics.instrumentation.sent.chunks",          INT8OID},  
+ LogDesc{"instrumentation_received_total_bytes",     "query_metrics.instrumentation.received.total_bytes", INT8OID},  
+ LogDesc{"instrumentation_received_tuple_bytes",     "query_metrics.instrumentation.received.tuple_bytes", INT8OID},  
+ LogDesc{"instrumentation_received_chunks",          "query_metrics.instrumentation.received.chunks",      INT8OID},  
+ /* 8-byte aligned types - Interconnect Stats and spilled bytes */  
+ LogDesc{"interconnect_total_recv_queue_size",         "query_metrics.instrumentation.interconnect.total_recv_queue_size",         INT8OID},  
+ LogDesc{"interconnect_recv_queue_size_counting_time", "query_metrics.instrumentation.interconnect.recv_queue_size_counting_time", INT8OID},  
+ LogDesc{"interconnect_total_capacity",                "query_metrics.instrumentation.interconnect.total_capacity",                INT8OID},  
+ LogDesc{"interconnect_capacity_counting_time",        "query_metrics.instrumentation.interconnect.capacity_counting_time",        INT8OID},  
+ LogDesc{"interconnect_total_buffers",                 "query_metrics.instrumentation.interconnect.total_buffers",                 INT8OID},  
+ LogDesc{"interconnect_buffer_counting_time",          "query_metrics.instrumentation.interconnect.buffer_counting_time",          INT8OID},  
+ LogDesc{"interconnect_active_connections_num",        "query_metrics.instrumentation.interconnect.active_connections_num",        INT8OID},  
+ LogDesc{"interconnect_retransmits",                   "query_metrics.instrumentation.interconnect.retransmits",                   INT8OID},  
+ LogDesc{"interconnect_startup_cached_pkt_num",        "query_metrics.instrumentation.interconnect.startup_cached_pkt_num",        INT8OID},  
+ LogDesc{"interconnect_mismatch_num",                  "query_metrics.instrumentation.interconnect.mismatch_num",                  INT8OID},  
+ LogDesc{"interconnect_crc_errors",                    "query_metrics.instrumentation.interconnect.crc_errors",                    INT8OID},  
+ LogDesc{"interconnect_snd_pkt_num",                   "query_metrics.instrumentation.interconnect.snd_pkt_num",                   INT8OID},  
+ LogDesc{"interconnect_recv_pkt_num",                  "query_metrics.instrumentation.interconnect.recv_pkt_num",                  INT8OID},  
+ LogDesc{"interconnect_disordered_pkt_num",            "query_metrics.instrumentation.interconnect.disordered_pkt_num",            INT8OID},  
+ LogDesc{"interconnect_duplicated_pkt_num",            "query_metrics.instrumentation.interconnect.duplicated_pkt_num",            INT8OID},  
+ LogDesc{"interconnect_recv_ack_num",                  "query_metrics.instrumentation.interconnect.recv_ack_num",                  INT8OID},  
+ LogDesc{"interconnect_status_query_msg_num",          "query_metrics.instrumentation.interconnect.status_query_msg_num",          INT8OID},
+ LogDesc{"spill_totalbytes",                           "query_metrics.spill.totalBytes",                                           INT8OID},
+ /* 8-byte aligned types - Float and Timestamp */  
+ LogDesc{"systemstat_runningtimeseconds",     "query_metrics.systemStat.runningTimeSeconds",  FLOAT8OID},  
+ LogDesc{"systemstat_usertimeseconds",        "query_metrics.systemStat.userTimeSeconds",     FLOAT8OID},  
+ LogDesc{"systemstat_kerneltimeseconds",      "query_metrics.systemStat.kernelTimeSeconds",   FLOAT8OID},  
+ LogDesc{"instrumentation_firsttuple",        "query_metrics.instrumentation.firsttuple",     FLOAT8OID},  
+ LogDesc{"instrumentation_startup",           "query_metrics.instrumentation.startup",        FLOAT8OID},  
+ LogDesc{"instrumentation_total",             "query_metrics.instrumentation.total",          FLOAT8OID},  
+ LogDesc{"instrumentation_blk_read_time",     "query_metrics.instrumentation.blk_read_time",  FLOAT8OID},  
+ LogDesc{"instrumentation_blk_write_time",    "query_metrics.instrumentation.blk_write_time", FLOAT8OID},  
+ LogDesc{"instrumentation_startup_time",      "query_metrics.instrumentation.startup_time",   FLOAT8OID},  
+ LogDesc{"instrumentation_inherited_time",    "query_metrics.instrumentation.inherited_time", FLOAT8OID},  
+ LogDesc{"datetime",            "datetime",                       TIMESTAMPTZOID},  
+ LogDesc{"submit_time",         "submit_time",                    TIMESTAMPTZOID},  
+ LogDesc{"start_time",          "start_time",                     TIMESTAMPTZOID},  
+ LogDesc{"end_time",            "end_time",                       TIMESTAMPTZOID},  
+ /* 4-byte aligned types - Query Key */  
+ LogDesc{"tmid",                "query_key.tmid",                 INT4OID},  
+ LogDesc{"ssid",                "query_key.ssid",                 INT4OID},  
+ LogDesc{"ccnt",                "query_key.ccnt",                 INT4OID},  
+ /* 4-byte aligned types - Segment Key */  
+ LogDesc{"dbid",                "segment_key.dbid",               INT4OID},  
+ LogDesc{"segid",               "segment_key.segindex",           INT4OID},  
+ LogDesc{"spill_filecount",     "query_metrics.spill.fileCount",  INT4OID},  
+ /* Variable-length types - Query Info */  
+ LogDesc{"generator",           "query_info.generator",           TEXTOID},  
+ LogDesc{"query_text",          "query_info.query_text",          TEXTOID},  
+ LogDesc{"plan_text",           "query_info.plan_text",           TEXTOID},  
+ LogDesc{"template_query_text", "query_info.template_query_text", TEXTOID},  
+ LogDesc{"template_plan_text",  "query_info.template_plan_text",  TEXTOID},  
+ LogDesc{"user_name",           "query_info.userName",            TEXTOID},  
+ LogDesc{"database_name",       "query_info.databaseName",        TEXTOID},  
+ LogDesc{"rsgname",             "query_info.rsgname",             TEXTOID},  
+ LogDesc{"analyze_text",        "query_info.analyze_text",        TEXTOID},  
+ LogDesc{"error_message",       "add_info.error_message",         TEXTOID},  
+ LogDesc{"query_status",        "query_status",                   TEXTOID},  
+ /* Extra field */
+ LogDesc{"utility",             "",                               BOOLOID},  
+};
+/* clang-format on */
+
+inline constexpr size_t natts_gpsc_log = log_tbl_desc.size(); /* number of entries (columns) in log_tbl_desc */
+inline constexpr size_t attnum_gpsc_log_utility = natts_gpsc_log - 1; /* zero-based index of the last entry, "utility" */
+
+const std::unordered_map<std::string_view, size_t> &proto_name_to_col_idx(); /* NOTE(review): presumably maps proto_field_name to its index in log_tbl_desc -- confirm in the definition */
+
+TupleDesc DescribeTuple(); /* NOTE(review): presumably the tuple descriptor built from log_tbl_desc -- confirm in the definition */
+
+Datum protots_to_timestamptz(const google::protobuf::Timestamp &ts); /* used by process_field() for google.protobuf.Timestamp fields */
+
+Datum field_to_datum(const google::protobuf::FieldDescriptor *field,
+					 const google::protobuf::Reflection *reflection,
+					 const google::protobuf::Message &msg); /* used by process_field() for every non-Timestamp field */
+
+/*
+ * Process a single proto field and store in values/nulls arrays.
+ *
+ * field_name is the dotted path used to look up the column index.  A name
+ * that is not registered in the log table is reported with a NOTICE and
+ * skipped; a field that is not set in msg is stored as NULL.
+ */
+void process_field(const google::protobuf::FieldDescriptor *field,
+				   const google::protobuf::Reflection *reflection,
+				   const google::protobuf::Message &msg,
+				   const std::string &field_name, Datum *values, bool *nulls);
+
+/*
+ * Extracts values from msg into values/nulls arrays. Caller must
+ * pre-init nulls[] to true (this function does not set nulls
+ * to true for nested messages if parent message is missing).
+ * prefix is the dotted path of msg within the top-level message;
+ * pass "" for the top-level message itself.
+ */
+void extract_query_req(const google::protobuf::Message &msg,
+					   const std::string &prefix, Datum *values, bool *nulls);
+
+#endif /* LOGSCHEMA_H */
diff --git a/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.cpp b/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.cpp
new file mode 100644
index 00000000000..de54a716016
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.cpp
@@ -0,0 +1,316 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * gpdbwrappers.cpp
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "gpdbwrappers.h"
+#include "log/LogOps.h"
+
+extern "C" {
+#include "postgres.h"
+#include "access/htup.h"
+#include "access/tupdesc.h"
+#include "cdb/cdbexplain.h"
+#include "commands/dbcommands.h"
+#include "commands/explain.h"
+#include "commands/resgroupcmds.h"
+#include "executor/instrument.h"
+#include "nodes/pg_list.h"
+#include "stat_statements_parser/pg_stat_statements_parser.h"
+#include "utils/builtins.h"
+#include "utils/elog.h"
+#include "utils/guc.h"
+#include "utils/varlena.h"
+}
+
+namespace
+{
+
+// Invoke func(args...) inside PG_TRY/PG_CATCH.
+//
+// On success the call's result (if any) is returned.  If the call raises a
+// PostgreSQL error, the error data is copied (allocated in TopMemoryContext),
+// the error state is flushed, and then:
+//   - Throws == true:  std::runtime_error is thrown, carrying the error
+//     message or "Unknown error occurred" when there is none;
+//   - Throws == false: a value-initialized RetType is returned (nothing for
+//     void), i.e. the error is swallowed.
+template <bool Throws, typename Func, typename... Args>
+auto
+wrap(Func &&func, Args &&...args) noexcept(!Throws)
+	-> decltype(func(std::forward<Args>(args)...))
+{
+	using RetType = decltype(func(std::forward<Args>(args)...));
+	constexpr bool returns_void = std::is_void_v<RetType>;
+
+	// Stand-in for the result slot when there is no result to keep.
+	struct NoValue
+	{
+	};
+	using Holder =
+		std::conditional_t<returns_void, NoValue, std::optional<RetType>>;
+
+	Holder holder;
+	ErrorData *edata = NULL;
+	bool success;
+
+	PG_TRY();
+	{
+		if constexpr (returns_void)
+		{
+			func(std::forward<Args>(args)...);
+		}
+		else
+		{
+			holder.emplace(func(std::forward<Args>(args)...));
+		}
+		success = true;
+	}
+	PG_CATCH();
+	{
+		// Copy the error out into TopMemoryContext before clearing the
+		// error state.
+		MemoryContext oldctx = MemoryContextSwitchTo(TopMemoryContext);
+		edata = CopyErrorData();
+		MemoryContextSwitchTo(oldctx);
+		FlushErrorState();
+		success = false;
+	}
+	PG_END_TRY();
+
+	if (success)
+	{
+		if constexpr (returns_void)
+		{
+			return;
+		}
+		else
+		{
+			return *std::move(holder);
+		}
+	}
+
+	// Error path: take the message, then release the copied error data.
+	const std::string err = (edata && edata->message)
+								? std::string(edata->message)
+								: std::string("Unknown error occurred");
+	if (edata)
+	{
+		FreeErrorData(edata);
+	}
+
+	if constexpr (Throws)
+	{
+		throw std::runtime_error(err);
+	}
+
+	if constexpr (returns_void)
+	{
+		return;
+	}
+	else
+	{
+		return RetType{};
+	}
+}
+
+// wrap() variant that turns a PostgreSQL error into std::runtime_error.
+template <typename Func, typename... Args>
+auto
+wrap_throw(Func &&func, Args &&...args)
+	-> decltype(func(std::forward<Args>(args)...))
+{
+	return wrap<true>(std::forward<Func>(func), std::forward<Args>(args)...);
+}
+
+// wrap() variant that never throws: on a PostgreSQL error it returns a
+// value-initialized result instead.
+template <typename Func, typename... Args>
+auto
+wrap_noexcept(Func &&func, Args &&...args) noexcept
+	-> decltype(func(std::forward<Args>(args)...))
+{
+	return wrap<false>(std::forward<Func>(func), std::forward<Args>(args)...);
+}
+}  // namespace
+
+void *
+gpdb::palloc(Size size)
+{
+	return wrap_throw(::palloc, size);
+}
+
+void *
+gpdb::palloc0(Size size)
+{
+	return wrap_throw(::palloc0, size);
+}
+
+char *
+gpdb::pstrdup(const char *str)
+{
+	return wrap_throw(::pstrdup, str);
+}
+
+// Calls ::get_database_name(dbid).  Never throws: if PostgreSQL raises an
+// error, the result is nullptr.
+char *
+gpdb::get_database_name(Oid dbid) noexcept
+{
+	char *db_name = wrap_noexcept(::get_database_name, dbid);
+	return db_name;
+}
+
+// Calls SplitIdentifierString(rawstring, separator, namelist).  Never
+// throws: if PostgreSQL raises an error, the result is false.
+bool
+gpdb::split_identifier_string(char *rawstring, char separator,
+							  List **namelist) noexcept
+{
+	const bool ok =
+		wrap_noexcept(SplitIdentifierString, rawstring, separator, namelist);
+	return ok;
+}
+
+// Produce verbose, text-format EXPLAIN output for query_desc, with cost
+// display controlled by costs, and return a copy of the ExplainState.
+// Never throws: if PostgreSQL raises an error, a value-initialized
+// ExplainState is returned.
+ExplainState
+gpdb::get_explain_state(QueryDesc *query_desc, bool costs) noexcept
+{
+	auto explain_plan = [&]() {
+		ExplainState *state = NewExplainState();
+
+		state->format = EXPLAIN_FORMAT_TEXT;
+		state->verbose = true;
+		state->costs = costs;
+
+		ExplainBeginOutput(state);
+		ExplainPrintPlan(state, query_desc);
+		ExplainEndOutput(state);
+
+		return *state;
+	};
+
+	return wrap_noexcept(explain_plan);
+}
+
+// Produce verbose, text-format EXPLAIN output for query_desc and return a
+// copy of the ExplainState.  The analyze flag also switches the buffers,
+// timing and summary options; the plan and the execution statistics are
+// printed only when analyze is true.
+// Never throws: if PostgreSQL raises an error, a value-initialized
+// ExplainState is returned.
+ExplainState
+gpdb::get_analyze_state(QueryDesc *query_desc, bool analyze) noexcept
+{
+	auto explain_analyze = [&]() {
+		ExplainState *state = NewExplainState();
+
+		state->format = EXPLAIN_FORMAT_TEXT;
+		state->verbose = true;
+		state->analyze = analyze;
+		state->buffers = state->analyze;
+		state->timing = state->analyze;
+		state->summary = state->analyze;
+
+		ExplainBeginOutput(state);
+		if (analyze)
+		{
+			ExplainPrintPlan(state, query_desc);
+			ExplainPrintExecStatsEnd(state, query_desc);
+		}
+		ExplainEndOutput(state);
+
+		return *state;
+	};
+
+	return wrap_noexcept(explain_analyze);
+}
+
+Instrumentation *
+gpdb::instr_alloc(size_t n, int instrument_options, bool async_mode)
+{
+	return wrap_throw(InstrAlloc, n, instrument_options, async_mode);
+}
+
+// Calls ::heap_form_tuple(tupleDescriptor, values, isnull).
+// Throws std::runtime_error when any argument is null, or when PostgreSQL
+// raises an error while forming the tuple.
+HeapTuple
+gpdb::heap_form_tuple(TupleDesc tupleDescriptor, Datum *values, bool *isnull)
+{
+	const bool args_ok = tupleDescriptor && values && isnull;
+
+	if (!args_ok)
+	{
+		throw std::runtime_error(
+			"Invalid input parameters for heap tuple formation");
+	}
+
+	HeapTuple tuple =
+		wrap_throw(::heap_form_tuple, tupleDescriptor, values, isnull);
+	return tuple;
+}
+
+// Calls ::pfree(pointer); a null pointer is ignored.  Never throws: a
+// PostgreSQL error raised by the call is swallowed.
+void
+gpdb::pfree(void *pointer) noexcept
+{
+	// ::pfree asserts that pointer != NULL, so only forward real pointers.
+	if (pointer)
+	{
+		wrap_noexcept(::pfree, pointer);
+	}
+}
+
+// Forwards directly to MemoryContextSwitchTo(context) and returns its
+// result.  The call is not routed through the PG_TRY wrappers.
+MemoryContext
+gpdb::mem_ctx_switch_to(MemoryContext context) noexcept
+{
+	MemoryContext result = MemoryContextSwitchTo(context);
+	return result;
+}
+
+// Calls GetConfigOption(name, missing_ok, restrict_superuser).
+// Never throws: returns nullptr when name is null or when PostgreSQL raises
+// an error.
+const char *
+gpdb::get_config_option(const char *name, bool missing_ok,
+						bool restrict_superuser) noexcept
+{
+	if (name == nullptr)
+	{
+		return nullptr;
+	}
+
+	const char *value =
+		wrap_noexcept(GetConfigOption, name, missing_ok, restrict_superuser);
+	return value;
+}
+
+// Calls ::list_free(list); a null list is ignored.  Never throws: a
+// PostgreSQL error raised by the call is swallowed.
+void
+gpdb::list_free(List *list) noexcept
+{
+	if (list)
+	{
+		wrap_noexcept(::list_free, list);
+	}
+}
+
+// Calls ::cdbexplain_showExecStatsBegin(query_desc, starttime).
+// Throws std::runtime_error when query_desc is null, or when PostgreSQL
+// raises an error during the call.
+CdbExplain_ShowStatCtx *
+gpdb::cdbexplain_showExecStatsBegin(QueryDesc *query_desc, instr_time starttime)
+{
+	if (query_desc == nullptr)
+	{
+		throw std::runtime_error("Invalid query descriptor");
+	}
+
+	CdbExplain_ShowStatCtx *ctx =
+		wrap_throw(::cdbexplain_showExecStatsBegin, query_desc, starttime);
+	return ctx;
+}
+
+// Calls ::InstrEndLoop(instr).
+// Throws std::runtime_error when instr is null, or when PostgreSQL raises
+// an error during the call.
+void
+gpdb::instr_end_loop(Instrumentation *instr)
+{
+	if (instr == nullptr)
+	{
+		throw std::runtime_error("Invalid instrumentation pointer");
+	}
+
+	wrap_throw(::InstrEndLoop, instr);
+}
+
+// Calls ::gen_normquery(query).  Never throws: if PostgreSQL raises an
+// error, the result is nullptr.
+char *
+gpdb::gen_normquery(const char *query) noexcept
+{
+	char *normalized = wrap_noexcept(::gen_normquery, query);
+	return normalized;
+}
+
+// Calls ::gen_normplan(exec_plan), which replaces the constants in an
+// execution plan text with substitute variables.
+// Never throws: returns nullptr when exec_plan is null or when PostgreSQL
+// raises an error while scanning the plan.
+StringInfo
+gpdb::gen_normplan(const char *exec_plan) noexcept
+{
+	// ::gen_normplan hands the text straight to the core scanner, which
+	// cannot cope with a null string; a crash there is not a PostgreSQL
+	// error and would not be caught by wrap_noexcept.
+	if (!exec_plan)
+		return nullptr;
+
+	return wrap_noexcept(::gen_normplan, exec_plan);
+}
+
+char *
+gpdb::get_rg_name_for_id(Oid group_id)
+{
+	return wrap_throw(GetResGroupNameForId, group_id);
+}
+
+Oid
+gpdb::get_rg_id_by_session_id(int session_id)
+{
+	return wrap_throw(ResGroupGetGroupIdBySessionId, session_id);
+}
+
+void
+gpdb::insert_log(const gpsc::SetQueryReq &req, bool utility)
+{
+	return wrap_throw(::insert_log, req, utility);
+}
diff --git a/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.h b/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.h
new file mode 100644
index 00000000000..5237b6be68a
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.h
@@ -0,0 +1,86 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * gpdbwrappers.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/memory/gpdbwrappers.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef GPDBWRAPPERS_H
+#define GPDBWRAPPERS_H
+
+extern "C" {
+#include "postgres.h"
+#include "access/htup.h"
+#include "commands/explain.h"
+#include "executor/instrument.h"
+#include "nodes/pg_list.h"
+#include "utils/elog.h"
+#include "utils/memutils.h"
+}
+
+#include <optional>
+#include <stdexcept>
+#include <string>
+#include <type_traits>
+#include <utility>
+
+namespace gpsc
+{
+class SetQueryReq;
+}  // namespace gpsc
+
+namespace gpdb
+{
+
+// Functions that call palloc().
+// Make sure correct memory context is set.
+void *palloc(Size size);  // throws std::runtime_error on a PostgreSQL error
+void *palloc0(Size size);  // throws std::runtime_error on a PostgreSQL error
+char *pstrdup(const char *str);  // throws std::runtime_error on a PostgreSQL error
+char *get_database_name(Oid dbid) noexcept;  // nullptr on a PostgreSQL error
+bool split_identifier_string(char *rawstring, char separator,
+							 List **namelist) noexcept;  // false on a PostgreSQL error
+ExplainState get_explain_state(QueryDesc *query_desc, bool costs) noexcept;  // value-initialized state on a PostgreSQL error
+ExplainState get_analyze_state(QueryDesc *query_desc, bool analyze) noexcept;  // value-initialized state on a PostgreSQL error
+Instrumentation *instr_alloc(size_t n, int instrument_options, bool async_mode);  // throws std::runtime_error on a PostgreSQL error
+HeapTuple heap_form_tuple(TupleDesc tupleDescriptor, Datum *values,
+						  bool *isnull);  // throws std::runtime_error on a null argument or a PostgreSQL error
+CdbExplain_ShowStatCtx *cdbexplain_showExecStatsBegin(QueryDesc *query_desc,
+													  instr_time starttime);  // throws std::runtime_error on a null query_desc or a PostgreSQL error
+void instr_end_loop(Instrumentation *instr);  // throws std::runtime_error on a null instr or a PostgreSQL error
+char *gen_normquery(const char *query) noexcept;  // nullptr on a PostgreSQL error
+StringInfo gen_normplan(const char *executionPlan) noexcept;  // nullptr on a PostgreSQL error
+char *get_rg_name_for_id(Oid group_id);  // throws std::runtime_error on a PostgreSQL error
+void insert_log(const gpsc::SetQueryReq &req, bool utility);  // throws std::runtime_error on a PostgreSQL error
+
+// Palloc-free functions.
+void pfree(void *pointer) noexcept;  // null pointer is ignored
+MemoryContext mem_ctx_switch_to(MemoryContext context) noexcept;
+const char *get_config_option(const char *name, bool missing_ok,
+							  bool restrict_superuser) noexcept;  // nullptr on a null name or a PostgreSQL error
+void list_free(List *list) noexcept;  // null list is ignored
+Oid get_rg_id_by_session_id(int session_id);  // not noexcept: throws std::runtime_error on a PostgreSQL error
+
+}  // namespace gpdb
+
+#endif /* GPDBWRAPPERS_H */
diff --git a/gpcontrib/gp_stats_collector/src/stat_statements_parser/README.md b/gpcontrib/gp_stats_collector/src/stat_statements_parser/README.md
new file mode 100644
index 00000000000..927189474fe
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/stat_statements_parser/README.md
@@ -0,0 +1,20 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one
+  or more contributor license agreements.  See the NOTICE file
+  distributed with this work for additional information
+  regarding copyright ownership.  The ASF licenses this file
+  to you under the Apache License, Version 2.0 (the
+  "License"); you may not use this file except in compliance
+  with the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing,
+  software distributed under the License is distributed on an
+  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  KIND, either express or implied.  See the License for the
+  specific language governing permissions and limitations
+  under the License.
+-->
+
+This directory contains a slightly modified subset of pg_stat_statements for PG v9.4 to be used in query and plan ID generation.
diff --git a/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.c b/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.c
new file mode 100644
index 00000000000..8e7bd917541
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.c
@@ -0,0 +1,378 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * pg_stat_statements_parser.c
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.c
+ *
+ *-------------------------------------------------------------------------
+ */
+
+// NOTE: this file is code borrowed from pg_stat_statements for PG 9.4
+// and from our own in-house implementation of pg_stat_statements for managed PG.
+
+#include "postgres.h"
+
+#include <sys/stat.h>
+#include <unistd.h>
+
+#include "common/hashfn.h"
+#include "lib/stringinfo.h"
+#include "mb/pg_wchar.h"
+#include "miscadmin.h"
+#include "parser/scanner.h"
+#include "utils/builtins.h"
+#include "utils/memutils.h"
+#include "utils/queryjumble.h"
+
+#include "pg_stat_statements_parser.h"
+
+#ifndef FCONST /* fallback token codes, defined only when no header provides them; NOTE(review): the numbers must match the codes core_yylex() returns -- confirm against the generated parser header */
+#define FCONST 260
+#endif
+#ifndef SCONST
+#define SCONST 261
+#endif
+#ifndef BCONST
+#define BCONST 263
+#endif
+#ifndef XCONST
+#define XCONST 264
+#endif
+#ifndef ICONST
+#define ICONST 266
+#endif
+
+static void fill_in_constant_lengths(JumbleState *jstate, const char *query);
+static int comp_location(const void *a, const void *b);
+StringInfo gen_normplan(const char *execution_plan);
+static bool need_replace(int token);
+static char *generate_normalized_query(JumbleState *jstate, const char *query,
+									   int *query_len_p, int encoding);
+
+void
+stat_statements_parser_init(void)
+{
+	EnableQueryId(); /* NOTE(review): presumably requests core query-id computation (utils/queryjumble.h) -- confirm */
+}
+
+void
+stat_statements_parser_deinit(void)
+{
+	/* NO-OP: intentionally empty counterpart of stat_statements_parser_init() */
+}
+
+/*
+ * need_replace - tell whether a scanner token is one of the constant tokens
+ * (FCONST, ICONST, SCONST, BCONST, XCONST) that must be replaced by a
+ * substitute variable.
+ */
+static bool
+need_replace(int token)
+{
+	switch (token)
+	{
+		case FCONST:
+		case ICONST:
+		case SCONST:
+		case BCONST:
+		case XCONST:
+			return true;
+		default:
+			return false;
+	}
+}
+
+/*
+ * gen_normplan - parse execution plan using flex and replace all CONST to
+ * substitute variables.
+ *
+ * The plan text is scanned with the core scanner.  Every constant token
+ * (see need_replace()) is emitted as a numbered substitute variable ($1,
+ * $2, ...); all other text is copied unchanged.
+ *
+ * The output is appended directly to the returned StringInfo.  No
+ * malloc()-backed temporaries are used, so nothing leaks if appending
+ * raises an error.
+ */
+StringInfo
+gen_normplan(const char *execution_plan)
+{
+	core_yyscan_t yyscanner;
+	core_yy_extra_type yyextra;
+	core_YYSTYPE yylval;
+	YYLTYPE yylloc;
+	int tok;
+	int bind_prefix = 1;
+	YYLTYPE last_yylloc = 0;
+	int last_tok = 0;
+	StringInfo plan_out = makeStringInfo();
+
+	yyscanner = scanner_init(execution_plan, &yyextra,
+#if PG_VERSION_NUM >= 120000
+							 &ScanKeywords, ScanKeywordTokens
+#else
+							 ScanKeywords, NumScanKeywords
+#endif
+	);
+
+	for (;;)
+	{
+		/* get the next lexeme */
+		tok = core_yylex(&yylval, &yylloc, yyscanner);
+
+		/*
+		 * yylloc now marks where the span of the previous lexeme ends, so
+		 * the previous lexeme can be processed.
+		 */
+		if (need_replace(last_tok))
+		{
+			/* substitute variable instead of CONST */
+			appendStringInfo(plan_out, "$%d", bind_prefix++);
+		}
+		else
+		{
+			const char *chunk = execution_plan + last_yylloc;
+
+			/*
+			 * Do not change - just copy as-is.  strnlen() keeps the copy
+			 * from running past the terminating NUL, exactly as the
+			 * strndup() call it replaces did.
+			 */
+			appendBinaryStringInfo(plan_out, chunk,
+								   strnlen(chunk, yylloc - last_yylloc));
+		}
+		/* check if further parsing not needed */
+		if (tok == 0)
+			break;
+		last_tok = tok;
+		last_yylloc = yylloc;
+	}
+
+	scanner_finish(yyscanner);
+
+	return plan_out;
+}
+
+/*
+ * comp_location: qsort comparator that orders LocationLen records by
+ * ascending location.
+ */
+static int
+comp_location(const void *a, const void *b)
+{
+	const LocationLen *lhs = (const LocationLen *) a;
+	const LocationLen *rhs = (const LocationLen *) b;
+
+	/* Evaluates to -1, 0 or +1. */
+	return (lhs->location > rhs->location) - (lhs->location < rhs->location);
+}
+
+/*
+ * Given a valid SQL string and an array of constant-location records,
+ * fill in the textual lengths of those constants.
+ *
+ * jstate->clocations is sorted in place by location.  For each distinct
+ * location, the matching record's length is set to the byte length of the
+ * constant token found there in the query text.
+ *
+ * The constants may use any allowed constant syntax, such as float literals,
+ * bit-strings, single-quoted strings and dollar-quoted strings.  This is
+ * accomplished by using the public API for the core scanner.
+ *
+ * It is the caller's job to ensure that the string is a valid SQL statement
+ * with constants at the indicated locations.  Since in practice the string
+ * has already been parsed, and the locations that the caller provides will
+ * have originated from within the authoritative parser, this should not be
+ * a problem.
+ *
+ * Duplicate constant pointers are possible, and will have their lengths
+ * marked as '-1', so that they are later ignored.  (Actually, we assume the
+ * lengths were initialized as -1 to start with, and don't change them here.)
+ *
+ * N.B. There is an assumption that a '-' character at a Const location begins
+ * a negative numeric constant.  This precludes there ever being another
+ * reason for a constant to start with a '-'.
+ */
+static void
+fill_in_constant_lengths(JumbleState *jstate, const char *query)
+{
+	LocationLen *locs;
+	core_yyscan_t yyscanner;
+	core_yy_extra_type yyextra;
+	core_YYSTYPE yylval;
+	YYLTYPE yylloc;
+	int last_loc = -1;
+	int i;
+
+	/*
+	 * Sort the records by location so that we can process them in order while
+	 * scanning the query text.
+	 */
+	if (jstate->clocations_count > 1)
+		qsort(jstate->clocations, jstate->clocations_count, sizeof(LocationLen),
+			  comp_location);
+	locs = jstate->clocations;
+
+	/* initialize the flex scanner --- should match raw_parser() */
+	yyscanner = scanner_init(query, &yyextra, &ScanKeywords, ScanKeywordTokens);
+
+	/* Search for each constant, in sequence */
+	for (i = 0; i < jstate->clocations_count; i++)
+	{
+		int loc = locs[i].location;
+		int tok;
+
+		Assert(loc >= 0);
+
+		if (loc <= last_loc)
+			continue; /* Duplicate constant, ignore */
+
+		/* Lex tokens until we find the desired constant */
+		for (;;)
+		{
+			tok = core_yylex(&yylval, &yylloc, yyscanner);
+
+			/* We should not hit end-of-string, but if we do, behave sanely */
+			if (tok == 0)
+				break; /* out of inner for-loop */
+
+			/*
+			 * We should find the token position exactly, but if we somehow
+			 * run past it, work with that.
+			 */
+			if (yylloc >= loc)
+			{
+				if (query[loc] == '-')
+				{
+					/*
+					 * It's a negative value - this is the one and only case
+					 * where we replace more than a single token.
+					 *
+					 * Do not compensate for the core system's special-case
+					 * adjustment of location to that of the leading '-'
+					 * operator in the event of a negative constant.  It is
+					 * also useful for our purposes to start from the minus
+					 * symbol.  In this way, queries like "select * from foo
+					 * where bar = 1" and "select * from foo where bar = -2"
+					 * will have identical normalized query strings.
+					 */
+					tok = core_yylex(&yylval, &yylloc, yyscanner);
+					if (tok == 0)
+						break; /* out of inner for-loop */
+				}
+
+				/*
+				 * We now rely on the assumption that flex has placed a zero
+				 * byte after the text of the current token in scanbuf.
+				 */
+				locs[i].length = strlen(yyextra.scanbuf + loc);
+				break; /* out of inner for-loop */
+			}
+		}
+
+		/* If we hit end-of-string, give up, leaving remaining lengths -1 */
+		if (tok == 0)
+			break;
+
+		last_loc = loc;
+	}
+
+	scanner_finish(yyscanner);
+}
+
+/*
+ * Build the normalized text that stands for every query differing from this
+ * one only in its constants: each recorded constant becomes a single '?'.
+ *
+ * The exact text may depend on which of several "equivalent" queries happens
+ * to be passed in (the one used to create the hashtable entry); that is
+ * assumed to be acceptable.
+ *
+ * On entry *query_len_p is the length of the input string; on exit it is the
+ * length of the result, which cannot be longer.
+ *
+ * The result is palloc'd.  The encoding argument is not used by this code.
+ */
+static char *
+generate_normalized_query(JumbleState *jstate, const char *query,
+						  int *query_len_p, int encoding)
+{
+	const int	src_len = *query_len_p;
+	char	   *result;
+	int			src_pos = 0;	/* next unread byte of the source query */
+	int			dst_pos = 0;	/* next free byte of the result */
+	int			chunk;			/* bytes of verbatim text to copy */
+	int			idx;
+
+	/*
+	 * The core system reports only where each constant starts, so work out
+	 * the lengths first.  This also leaves the entries sorted by location.
+	 */
+	fill_in_constant_lengths(jstate, query);
+
+	/*
+	 * The output cannot be longer than the input, so the input length plus a
+	 * terminating zero byte is always enough room.
+	 */
+	result = palloc(src_len + 1);
+
+	for (idx = 0; idx < jstate->clocations_count; idx++)
+	{
+		const LocationLen *cur = &jstate->clocations[idx];
+
+		/*
+		 * A negative length marks an entry to be ignored, such as a
+		 * duplicate location.
+		 */
+		if (cur->length < 0)
+			continue;
+
+		/*
+		 * Copy the stretch of source text lying between the end of the
+		 * previously replaced constant and the start of this one.
+		 */
+		chunk = cur->location - src_pos;
+		Assert(chunk >= 0);
+		memcpy(result + dst_pos, query + src_pos, chunk);
+		dst_pos += chunk;
+
+		/* The constant token itself collapses to one placeholder byte */
+		result[dst_pos] = '?';
+		dst_pos++;
+
+		/* Resume reading immediately after the constant */
+		src_pos = cur->location + cur->length;
+	}
+
+	/* Everything after the last replaced constant is copied unchanged */
+	chunk = src_len - src_pos;
+	Assert(chunk >= 0);
+	memcpy(result + dst_pos, query + src_pos, chunk);
+	dst_pos += chunk;
+
+	Assert(dst_pos <= src_len);
+	result[dst_pos] = '\0';
+
+	/* Report the new length back to the caller */
+	*query_len_p = dst_pos;
+	return result;
+}
+
+/*
+ * Return a palloc'd normalized copy of query, or NULL if query is NULL.
+ * NOTE(review): no constant locations are recorded here, so as written the
+ * normalizer has nothing to replace and the text comes back unchanged.
+ */
+char *
+gen_normquery(const char *query)
+{
+	JumbleState jstate = {0};	/* no locations: no scratch buffers needed */
+	int			query_len;
+
+	if (!query)
+		return NULL;
+
+	query_len = strlen(query);
+	return generate_normalized_query(&jstate, query, &query_len,
+									 GetDatabaseEncoding());
+}
\ No newline at end of file
diff --git a/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.h b/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.h
new file mode 100644
index 00000000000..b6c5dea7b36
--- /dev/null
+++ b/gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.h
@@ -0,0 +1,45 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * pg_stat_statements_parser.h
+ *
+ * IDENTIFICATION
+ *	  gpcontrib/gp_stats_collector/src/stat_statements_parser/pg_stat_statements_parser.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef PG_STAT_STATEMENTS_PARSER_H
+#define PG_STAT_STATEMENTS_PARSER_H
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+extern void stat_statements_parser_init(void);
+extern void stat_statements_parser_deinit(void);
+/* NOTE(review): this header includes nothing, so StringInfo must already be declared by the includer (presumably via lib/stringinfo.h) -- confirm */
+StringInfo gen_normplan(const char *executionPlan);
+char *gen_normquery(const char *query);	/* palloc'd normalized text, or NULL when query is NULL */
+
+#ifdef __cplusplus
+}
+#endif
+
+#endif /* PG_STAT_STATEMENTS_PARSER_H */
diff --git a/pom.xml b/pom.xml
index 0e000093399..b9915331c0c 100644
--- a/pom.xml
+++ b/pom.xml
@@ -572,9 +572,6 @@ code or new licensing patterns.
             <include>src/backend/gporca/**/Makefile</include>
 
             <exclude>src/backend/gporca/cmake/FindXerces.cmake</exclude>
-            <exclude>src/backend/gporca/concourse/build_and_test.py</exclude>
-            <exclude>src/backend/gporca/concourse/xerces-c/build_xerces.py</exclude>
-            <exclude>src/backend/gporca/concourse/xerces-c/xerces-c-3.1.2.tar.gz.sha256</exclude>
             <exclude>src/backend/gporca/server/fixdxl.sh</exclude>
             <exclude>src/backend/gporca/server/include/unittest/gpopt/operators/CScalarIsDistinctFromTest.h</exclude>
             <exclude>src/backend/gporca/server/dxl.xsd</exclude>
@@ -1050,6 +1047,7 @@ code or new licensing patterns.
             <exclude>src/backend/postmaster/test/checkpointer_test.c</exclude>
             <exclude>src/backend/postmaster/README.auto-ANALYZE</exclude>
             <exclude>src/backend/mock.mk</exclude>
+            <exclude>src/backend/catalog/system_views_gp.in</exclude>
             <exclude>src/backend/catalog/storage_tablespace.c</exclude>
             <exclude>src/backend/catalog/test/storage_tablespace_test.c</exclude>
             <exclude>src/backend/catalog/sql_features.txt</exclude>
@@ -1272,6 +1270,13 @@ code or new licensing patterns.
             <exclude>src/include/task/task_states.h</exclude>
             <exclude>src/include/task/job_metadata.h</exclude>
 
+            <!-- The following files are from extension's ecosystem,
+                 introduced by Cloudberry.
+            -->
+            <exclude>gpcontrib/gp_stats_collector/gp_stats_collector.control</exclude>
+            <exclude>gpcontrib/gp_stats_collector/.clang-format</exclude>
+            <exclude>gpcontrib/gp_stats_collector/Makefile</exclude>
+
             <!-- The following files are used by PAX as the 
                  submodules or created originally by Cloudberry.
             -->
@@ -1744,7 +1749,8 @@ code or new licensing patterns.
 
             <exclude>devops/deploy/docker/build/rocky8/tests/requirements.txt</exclude>
             <exclude>devops/deploy/docker/build/rocky9/tests/requirements.txt</exclude>
-	          <exclude>devops/deploy/docker/build/ubuntu22.04/tests/requirements.txt</exclude>
+            <exclude>devops/deploy/docker/build/rocky10/tests/requirements.txt</exclude>
+            <exclude>devops/deploy/docker/build/ubuntu22.04/tests/requirements.txt</exclude>
             <exclude>devops/deploy/docker/build/ubuntu24.04/tests/requirements.txt</exclude>
 
 	    <!-- Exclude ubuntu debian packaging files since they do not support comments
diff --git a/src/Makefile.global.in b/src/Makefile.global.in
index 77b58e7aa76..d413bd86761 100644
--- a/src/Makefile.global.in
+++ b/src/Makefile.global.in
@@ -271,6 +271,8 @@ with_zstd 		= @with_zstd@
 ZSTD_CFLAGS		= @ZSTD_CFLAGS@
 ZSTD_LIBS		= @ZSTD_LIBS@
 EVENT_LIBS		= @EVENT_LIBS@
+with_diskquota		= @with_diskquota@
+with_gp_stats_collector		= @with_gp_stats_collector@
 
 ##########################################################################
 #
diff --git a/src/backend/access/aocs/aocsam_handler.c b/src/backend/access/aocs/aocsam_handler.c
index c2faa538e10..4b3cd2a52ef 100644
--- a/src/backend/access/aocs/aocsam_handler.c
+++ b/src/backend/access/aocs/aocsam_handler.c
@@ -2044,15 +2044,25 @@ static uint64
 aoco_relation_size(Relation rel, ForkNumber forkNumber)
 {
 	AOCSFileSegInfo	  **allseg;
-	Snapshot			snapshot;
 	uint64				totalbytes	= 0;
 	int					totalseg;
 
 	if (forkNumber != MAIN_FORKNUM)
 		return totalbytes;
 
-	snapshot = RegisterSnapshot(GetLatestSnapshot());
-	allseg = GetAllAOCSFileSegInfo(rel, snapshot, &totalseg, NULL);
+	/*
+	 * Pass NULL as snapshot so that GetAllAOCSFileSegInfo -> systable_beginscan
+	 * uses GetCatalogSnapshot() internally.  This is consistent with
+	 * appendonly_relation_size() for AO row tables and ensures pg_aocsseg
+	 * entries are visible even when called within the same transaction that
+	 * populated them (e.g. ALTER TABLE SET DISTRIBUTED BY).
+	 *
+	 * Using GetLatestSnapshot() here previously caused the metadata to be
+	 * invisible on QE segments during in-transaction redistribution, leading
+	 * to a zero return value and a subsequent assertion failure in
+	 * vac_update_relstats().
+	 */
+	allseg = GetAllAOCSFileSegInfo(rel, NULL, &totalseg, NULL);
 	for (int seg = 0; seg < totalseg; seg++)
 	{
 		for (int attr = 0; attr < RelationGetNumberOfAttributes(rel); attr++)
@@ -2079,7 +2089,6 @@ aoco_relation_size(Relation rel, ForkNumber forkNumber)
 		FreeAllAOCSSegFileInfo(allseg, totalseg);
 		pfree(allseg);
 	}
-	UnregisterSnapshot(snapshot);
 
 	return totalbytes;
 }
diff --git a/src/backend/access/common/reloptions_gp.c b/src/backend/access/common/reloptions_gp.c
index fbf75fb9e10..cbfe5d7e28a 100644
--- a/src/backend/access/common/reloptions_gp.c
+++ b/src/backend/access/common/reloptions_gp.c
@@ -1791,7 +1791,7 @@ transformColumnEncoding(const TableAmRoutine *tam, Relation rel, List *colDefs,
 	return result;
 }
 
-List* transfromColumnEncodingAocoRootPartition(List *colDefs, List *stenc, List *withOptions, bool errorOnEncodingClause)
+List* transformColumnEncodingAocoRootPartition(List *colDefs, List *stenc, List *withOptions, bool errorOnEncodingClause)
 {
 	ColumnReferenceStorageDirective *deflt = NULL;
 	ListCell   *lc;
diff --git a/src/backend/access/external/external.c b/src/backend/access/external/external.c
index 62cff75db53..e42b4255af3 100644
--- a/src/backend/access/external/external.c
+++ b/src/backend/access/external/external.c
@@ -34,6 +34,47 @@
 
 static List *create_external_scan_uri_list(ExtTableEntry *ext, bool *ismasteronly);
 
+/*
+ * parse_fdw_encoding_option
+ *
+ * Convert the text of an "encoding" FDW OPTIONS entry into an encoding ID.
+ * "value" is either an encoding name (e.g. "UTF8", "utf-8", "GBK") resolved
+ * via pg_char_to_encoding(), or a decimal encoding code (e.g. "6").  Returns
+ * the ID; raises ERROR when value is NULL, empty, or matches neither form.
+ *
+ * atoi() is intentionally avoided for the numeric form: atoi("UTF8") silently
+ * returns 0 (= SQL_ASCII), which is exactly the bug this helper exists to
+ * fix.  strtol() lets us reject trailing junk and out-of-range input instead.
+ */
+int
+parse_fdw_encoding_option(const char *value)
+{
+	int			encoding;
+	char	   *endptr;
+	long		n;
+
+	if (value == NULL || *value == '\0')
+		ereport(ERROR,
+				(errcode(ERRCODE_FDW_INVALID_ATTRIBUTE_VALUE),
+				 errmsg("encoding option must not be empty")));
+
+	encoding = pg_char_to_encoding(value);
+	if (encoding >= 0)
+		return encoding;
+
+	/* Bound n before narrowing: a huge long cast to int could wrap to a valid ID */
+	errno = 0;
+	n = strtol(value, &endptr, 10);
+	if (endptr != value && *endptr == '\0' && errno == 0 &&
+		n >= 0 && n <= PG_INT32_MAX && PG_VALID_ENCODING((int) n))
+		return (int) n;
+
+	ereport(ERROR,
+			(errcode(ERRCODE_FDW_INVALID_ATTRIBUTE_VALUE),
+			 errmsg("\"%s\" is not a valid encoding name or code", value)));
+	return -1;					/* unreachable, keeps compiler happy */
+}
+
 void
 gfile_printf_then_putc_newline(const char *format,...)
 {
@@ -277,7 +318,7 @@ GetExtFromForeignTableOptions(List *ftoptons, Oid relid)
 
 		if (pg_strcasecmp(def->defname, "encoding") == 0)
 		{
-			extentry->encoding = atoi(defGetString(def));
+			extentry->encoding = parse_fdw_encoding_option(defGetString(def));
 			encoding_found = true;
 			continue;
 		}
diff --git a/src/backend/access/heap/visibilitymap.c b/src/backend/access/heap/visibilitymap.c
index e198df65d82..7d252fa94ab 100644
--- a/src/backend/access/heap/visibilitymap.c
+++ b/src/backend/access/heap/visibilitymap.c
@@ -645,6 +645,14 @@ vm_extend(Relation rel, BlockNumber vm_nblocks)
 		!smgrexists(rel->rd_smgr, VISIBILITYMAP_FORKNUM))
 		smgrcreate(rel->rd_smgr, VISIBILITYMAP_FORKNUM, false);
 
+	/*
+	 * Might have to re-open if smgrcreate triggered AcceptInvalidationMessages
+	 * (via TablespaceCreateDbspace -> LockSharedObject for non-default
+	 * tablespaces), which may have processed a pending SHAREDINVALSMGR_ID
+	 * message and closed our smgr entry.
+	 */
+	RelationOpenSmgr(rel);
+
 	/* Invalidate cache so that smgrnblocks() asks the kernel. */
 	rel->rd_smgr->smgr_cached_nblocks[VISIBILITYMAP_FORKNUM] = InvalidBlockNumber;
 	vm_nblocks_now = smgrnblocks(rel->rd_smgr, VISIBILITYMAP_FORKNUM);
diff --git a/src/backend/access/transam/xact.c b/src/backend/access/transam/xact.c
index d6b44fc8412..62ddae7a649 100644
--- a/src/backend/access/transam/xact.c
+++ b/src/backend/access/transam/xact.c
@@ -3036,13 +3036,15 @@ CommitTransaction(void)
 	DoPendingDbDeletes(true);
 
 	/*
-	 * Only QD holds the session level lock this long for a movedb operation.
-	 * This is to prevent another transaction from moving database objects into
-	 * the source database oid directory while it is being deleted. We don't
-	 * worry about aborts as we release session level locks automatically during
-	 * an abort as opposed to a commit.
-	 */
-	if(Gp_role == GP_ROLE_DISPATCH || IS_SINGLENODE())
+	 * Release the session level lock held for a movedb operation. The lock is
+	 * held this long to prevent another transaction from moving database
+	 * objects into the source database oid directory while it is being
+	 * deleted. We don't worry about aborts as we release session level locks
+	 * automatically during an abort as opposed to a commit. We must also
+	 * release in utility mode (e.g. standalone backends used in TAP tests).
+	 */
+	if (Gp_role == GP_ROLE_DISPATCH || Gp_role == GP_ROLE_UTILITY ||
+		IS_SINGLENODE())
 		MoveDbSessionLockRelease();
 
 	/*
diff --git a/src/backend/catalog/.gitignore b/src/backend/catalog/.gitignore
index 6c4c6d228db..3912b022a03 100644
--- a/src/backend/catalog/.gitignore
+++ b/src/backend/catalog/.gitignore
@@ -8,3 +8,4 @@
 /pg_*_d.h
 /gp_*_d.h
 /bki-stamp
+/system_views_gp.sql
diff --git a/src/backend/catalog/Makefile b/src/backend/catalog/Makefile
index b95f92f2e6e..e2ad48a8699 100644
--- a/src/backend/catalog/Makefile
+++ b/src/backend/catalog/Makefile
@@ -56,6 +56,9 @@ OBJS += pg_extprotocol.o \
 	   gp_matview_aux.o \
        pg_directory_table.o storage_directory_table.o
 
+GP_SYSVIEW_IN = system_views_gp.in
+GP_SYSVIEW_SQL = system_views_gp.sql
+
 CATALOG_JSON:= $(addprefix $(top_srcdir)/gpMgmt/bin/gppylib/data/, $(addsuffix .json,$(GP_MAJORVERSION)))
 
 include $(top_srcdir)/src/backend/common.mk
@@ -133,7 +136,7 @@ POSTGRES_BKI_DATA += $(addprefix $(top_srcdir)/src/include/catalog/,\
 	$(top_builddir)/src/include/catalog/gp_version_at_initdb.dat
 
 
-all: distprep generated-header-symlinks
+all: distprep generated-header-symlinks $(GP_SYSVIEW_SQL)
 
 distprep: bki-stamp
 
@@ -197,6 +200,8 @@ ifeq ($(USE_INTERNAL_FTS_FOUND), false)
 endif
 	$(INSTALL_DATA) $(srcdir)/system_functions.sql '$(DESTDIR)$(datadir)/system_functions.sql'
 	$(INSTALL_DATA) $(srcdir)/system_views.sql '$(DESTDIR)$(datadir)/system_views.sql'
+	$(INSTALL_DATA) $(srcdir)/$(GP_SYSVIEW_SQL) '$(DESTDIR)$(datadir)/$(GP_SYSVIEW_SQL)'
+	$(INSTALL_DATA) $(srcdir)/system_views_gp_summary.sql '$(DESTDIR)$(datadir)/system_views_gp_summary.sql'
 	$(INSTALL_DATA) $(srcdir)/information_schema.sql '$(DESTDIR)$(datadir)/information_schema.sql'
 	$(INSTALL_DATA) $(call vpathsearch,cdb_schema.sql) '$(DESTDIR)$(datadir)/cdb_init.d/cdb_schema.sql'
 	$(INSTALL_DATA) $(srcdir)/sql_features.txt '$(DESTDIR)$(datadir)/sql_features.txt'
@@ -208,7 +213,8 @@ installdirs:
 
 .PHONY: uninstall-data
 uninstall-data:
-	rm -f $(addprefix '$(DESTDIR)$(datadir)'/, postgres.bki system_constraints.sql system_functions.sql system_views.sql information_schema.sql cdb_init.d/cdb_schema.sql cdb_init.d/gp_toolkit.sql sql_features.txt fix-CVE-2024-4317.sql)
+# Mirror install-data: the generated $(GP_SYSVIEW_SQL) is installed too, so remove it as well.
+	rm -f $(addprefix '$(DESTDIR)$(datadir)'/, postgres.bki system_constraints.sql system_functions.sql system_views.sql $(GP_SYSVIEW_SQL) system_views_gp_summary.sql information_schema.sql cdb_init.d/cdb_schema.sql cdb_init.d/gp_toolkit.sql sql_features.txt fix-CVE-2024-4317.sql)
 ifeq ($(USE_INTERNAL_FTS_FOUND), false)
 	rm -f $(addprefix '$(DESTDIR)$(datadir)'/, external_fts.sql)
 endif
@@ -217,4 +223,4 @@ endif
 clean:
 
 maintainer-clean: clean
-	rm -f bki-stamp postgres.bki system_constraints.sql $(GENERATED_HEADERS)
+	rm -f bki-stamp postgres.bki system_constraints.sql $(GENERATED_HEADERS) $(GP_SYSVIEW_SQL)
diff --git a/src/backend/catalog/system_views.sql b/src/backend/catalog/system_views.sql
index 86e938a3b87..e68262830d4 100644
--- a/src/backend/catalog/system_views.sql
+++ b/src/backend/catalog/system_views.sql
@@ -657,7 +657,7 @@ REVOKE EXECUTE ON FUNCTION pg_get_backend_memory_contexts() FROM PUBLIC;
 
 -- Statistics views
 
-CREATE VIEW pg_stat_all_tables_internal AS
+CREATE VIEW pg_stat_all_tables AS
     SELECT
             C.oid AS relid,
             N.nspname AS schemaname,
@@ -689,81 +689,6 @@ CREATE VIEW pg_stat_all_tables_internal AS
     WHERE C.relkind IN ('r', 't', 'm', 'o', 'b', 'M', 'p')
     GROUP BY C.oid, N.nspname, C.relname;
 
--- Gather data from segments on user tables, and use data on coordinator on system tables.
-
-CREATE VIEW pg_stat_all_tables AS
-SELECT
-    s.relid,
-    s.schemaname,
-    s.relname,
-    m.seq_scan,
-    m.seq_tup_read,
-    m.idx_scan,
-    m.idx_tup_fetch,
-    m.n_tup_ins,
-    m.n_tup_upd,
-    m.n_tup_del,
-    m.n_tup_hot_upd,
-    m.n_live_tup,
-    m.n_dead_tup,
-    m.n_mod_since_analyze,
-    m.n_ins_since_vacuum,
-    s.last_vacuum,
-    s.last_autovacuum,
-    s.last_analyze,
-    s.last_autoanalyze,
-    s.vacuum_count,
-    s.autovacuum_count,
-    s.analyze_count,
-    s.autoanalyze_count
-FROM
-    (SELECT
-         allt.relid,
-         allt.schemaname,
-         allt.relname,
-         case when d.policytype = 'r' then (sum(seq_scan)/d.numsegments)::bigint else sum(seq_scan) end seq_scan,
-         case when d.policytype = 'r' then (sum(seq_tup_read)/d.numsegments)::bigint else sum(seq_tup_read) end seq_tup_read,
-         case when d.policytype = 'r' then (sum(idx_scan)/d.numsegments)::bigint else sum(idx_scan) end idx_scan,
-         case when d.policytype = 'r' then (sum(idx_tup_fetch)/d.numsegments)::bigint else sum(idx_tup_fetch) end idx_tup_fetch,
-         case when d.policytype = 'r' then (sum(n_tup_ins)/d.numsegments)::bigint else sum(n_tup_ins) end n_tup_ins,
-         case when d.policytype = 'r' then (sum(n_tup_upd)/d.numsegments)::bigint else sum(n_tup_upd) end n_tup_upd,
-         case when d.policytype = 'r' then (sum(n_tup_del)/d.numsegments)::bigint else sum(n_tup_del) end n_tup_del,
-         case when d.policytype = 'r' then (sum(n_tup_hot_upd)/d.numsegments)::bigint else sum(n_tup_hot_upd) end n_tup_hot_upd,
-         case when d.policytype = 'r' then (sum(n_live_tup)/d.numsegments)::bigint else sum(n_live_tup) end n_live_tup,
-         case when d.policytype = 'r' then (sum(n_dead_tup)/d.numsegments)::bigint else sum(n_dead_tup) end n_dead_tup,
-         case when d.policytype = 'r' then (sum(n_mod_since_analyze)/d.numsegments)::bigint else sum(n_mod_since_analyze) end n_mod_since_analyze,
-         case when d.policytype = 'r' then (sum(n_ins_since_vacuum)/d.numsegments)::bigint else sum(n_ins_since_vacuum) end n_ins_since_vacuum,
-         max(last_vacuum) as last_vacuum,
-         max(last_autovacuum) as last_autovacuum,
-         max(last_analyze) as last_analyze,
-         max(last_autoanalyze) as last_autoanalyze,
-         max(vacuum_count) as vacuum_count,
-         max(autovacuum_count) as autovacuum_count,
-         max(analyze_count) as analyze_count,
-         max(autoanalyze_count) as autoanalyze_count
-     FROM
-         gp_dist_random('pg_stat_all_tables_internal') allt
-         inner join pg_class c
-               on allt.relid = c.oid
-         left outer join gp_distribution_policy d
-              on allt.relid = d.localoid
-     WHERE
-        relid >= 16384
-        and (
-            d.localoid is not null
-            or c.relkind in ('o', 'b', 'M')
-            )
-     GROUP BY allt.relid, allt.schemaname, allt.relname, d.policytype, d.numsegments
-
-     UNION ALL
-
-     SELECT
-         *
-     FROM
-         pg_stat_all_tables_internal
-     WHERE
-             relid < 16384) m, pg_stat_all_tables_internal s
-WHERE m.relid = s.relid;
 
 CREATE VIEW pg_stat_xact_all_tables AS
     SELECT
@@ -812,10 +737,11 @@ CREATE VIEW pg_stat_user_tables AS
 -- since we don't have segments.
 -- We create a new view for single node mode.
 CREATE VIEW pg_stat_user_tables_single_node AS
-    SELECT * FROM pg_stat_all_tables_internal
+    SELECT * FROM pg_stat_all_tables
     WHERE schemaname NOT IN ('pg_catalog', 'information_schema') AND
           schemaname !~ '^pg_toast';
 
+
 CREATE VIEW pg_stat_xact_user_tables AS
     SELECT * FROM pg_stat_xact_all_tables
     WHERE schemaname NOT IN ('pg_catalog', 'information_schema') AND
@@ -856,7 +782,7 @@ CREATE VIEW pg_statio_user_tables AS
     WHERE schemaname NOT IN ('pg_catalog', 'information_schema') AND
           schemaname !~ '^pg_toast';
 
-CREATE VIEW pg_stat_all_indexes_internal AS
+CREATE VIEW pg_stat_all_indexes AS
     SELECT
             C.oid AS relid,
             I.oid AS indexrelid,
@@ -872,44 +798,6 @@ CREATE VIEW pg_stat_all_indexes_internal AS
             LEFT JOIN pg_namespace N ON (N.oid = C.relnamespace)
     WHERE C.relkind IN ('r', 't', 'm', 'o', 'b', 'M');
 
--- Gather data from segments on user tables, and use data on coordinator on system tables.
-
-CREATE VIEW pg_stat_all_indexes AS
-SELECT
-    s.relid,
-    s.indexrelid,
-    s.schemaname,
-    s.relname,
-    s.indexrelname,
-    m.idx_scan,
-    m.idx_tup_read,
-    m.idx_tup_fetch
-FROM
-    (SELECT
-         relid,
-         indexrelid,
-         schemaname,
-         relname,
-         indexrelname,
-         sum(idx_scan) as idx_scan,
-         sum(idx_tup_read) as idx_tup_read,
-         sum(idx_tup_fetch) as idx_tup_fetch
-     FROM
-         gp_dist_random('pg_stat_all_indexes_internal')
-     WHERE
-             relid >= 16384
-     GROUP BY relid, indexrelid, schemaname, relname, indexrelname
-
-     UNION ALL
-
-     SELECT
-         *
-     FROM
-         pg_stat_all_indexes_internal
-     WHERE
-             relid < 16384) m, pg_stat_all_indexes_internal s
-WHERE m.indexrelid = s.indexrelid;
-
 CREATE VIEW pg_stat_sys_indexes AS
     SELECT * FROM pg_stat_all_indexes
     WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR
@@ -1095,6 +983,7 @@ $$
 $$
 LANGUAGE SQL EXECUTE ON ALL SEGMENTS;
 
+-- This view has one more column than pg_stat_replication, so it cannot be generated from system_views_gp.in
 CREATE VIEW gp_stat_replication AS
     SELECT *, pg_catalog.gp_replication_error() AS sync_error
     FROM pg_catalog.gp_stat_get_master_replication() AS R
@@ -1802,11 +1691,6 @@ UNION ALL
   SELECT gp_segment_id, gp_get_suboverflowed_backends() FROM gp_dist_random('gp_id') order by 1;
 
 
-CREATE OR REPLACE VIEW gp_stat_archiver AS
-    SELECT -1 AS gp_segment_id, * FROM pg_stat_archiver
-    UNION
-    SELECT gp_execution_segment() AS gp_segment_id, * FROM gp_dist_random('pg_stat_archiver');
-
 CREATE FUNCTION gp_get_session_endpoints (OUT gp_segment_id int, OUT auth_token text,
 									  OUT cursorname text, OUT sessionid int, OUT hostname varchar(64),
 									  OUT port int, OUT username text, OUT state text,
diff --git a/src/backend/catalog/system_views_gp.in b/src/backend/catalog/system_views_gp.in
new file mode 100644
index 00000000000..cd865cea662
--- /dev/null
+++ b/src/backend/catalog/system_views_gp.in
@@ -0,0 +1,50 @@
+# This file lists the PG system views 'pg_%' for which an MPP-aware 'gp_%' view
+# should be generated. The generated 'gp_%' view definitions are placed in
+# system_views_gp.sql, which is initialized at the same time as system_views.sql.
+#pg_backend_memory_contexts
+pg_config
+pg_cursors
+pg_file_settings
+pg_replication_origin_status
+pg_replication_slots
+pg_settings
+pg_stat_activity
+pg_stat_all_indexes
+pg_stat_all_tables
+pg_stat_archiver
+pg_stat_bgwriter
+#pg_stat_database
+pg_stat_database_conflicts
+pg_stat_gssapi
+pg_stat_operations
+#pg_stat_progress_analyze
+#pg_stat_progress_basebackup
+#pg_stat_progress_cluster
+#pg_stat_progress_copy
+#pg_stat_progress_create_index
+#pg_stat_progress_vacuum
+pg_stat_slru
+pg_stat_ssl
+pg_stat_subscription
+pg_stat_sys_indexes
+pg_stat_sys_tables
+pg_stat_user_functions
+pg_stat_user_indexes
+pg_stat_user_tables
+#pg_stat_wal
+pg_stat_wal_receiver
+pg_stat_xact_all_tables
+pg_stat_xact_sys_tables
+pg_stat_xact_user_functions
+pg_stat_xact_user_tables
+pg_statio_all_indexes
+pg_statio_all_sequences
+pg_statio_all_tables
+pg_statio_sys_indexes
+pg_statio_sys_sequences
+pg_statio_sys_tables
+pg_statio_user_indexes
+pg_statio_user_sequences
+pg_statio_user_tables
+#pg_stats ERROR:  column "most_common_vals" has pseudo-type anyarray
+pg_stats_ext
diff --git a/src/backend/catalog/system_views_gp_summary.sql b/src/backend/catalog/system_views_gp_summary.sql
new file mode 100644
index 00000000000..f83329203ab
--- /dev/null
+++ b/src/backend/catalog/system_views_gp_summary.sql
@@ -0,0 +1,490 @@
+/*
+ * Greenplum System Summary Views
+ *
+ * Portions Copyright (c) 2006-2010, Greenplum inc.
+ * Portions Copyright (c) 2012-Present VMware, Inc. or its affiliates.
+ * Copyright (c) 1996-2019, PostgreSQL Global Development Group
+ *
+ * src/backend/catalog/system_views_gp_summary.sql
+ *
+ *
+ * This file contains summary views for various Greenplum system catalog
+ * views. These summary views are designed to provide aggregated or averaged
+ * information for partitioned and replicated tables, considering multiple
+ * segments in a Greenplum database.
+ *
+ * Note: this file is read in single-user -j mode, which means that the
+ * command terminator is semicolon-newline-newline; whenever the backend
+ * sees that, it stops and executes what it's got.  If you write a lot of
+ * statements without empty lines between, they'll all get quoted to you
+ * in any error message about one of them, so don't do that.  Also, you
+ * cannot write a semicolon immediately followed by an empty line in a
+ * string literal (including a function body!) or a multiline comment.
+ */
+
+CREATE VIEW gp_stat_archiver_summary AS  -- single-row rollup over every row of gp_stat_archiver
+SELECT
+    sum(gsa.archived_count) as archived_count,  -- counters are added together
+    max(gsa.last_archived_wal) as last_archived_wal,  -- each max() is independent, so WAL name and time may come from different rows
+    max(gsa.last_archived_time) as last_archived_time,
+    sum(gsa.failed_count) as failed_count,
+    max(gsa.last_failed_wal) as last_failed_wal,
+    max(gsa.last_failed_time) as last_failed_time,
+    max(gsa.stats_reset) as stats_reset  -- greatest (latest) reset timestamp among the rows
+FROM
+    gp_stat_archiver gsa;
+
+CREATE VIEW gp_stat_bgwriter_summary AS  -- single-row rollup over every row of gp_stat_bgwriter
+SELECT
+    sum(gsb.checkpoints_timed) as checkpoints_timed,  -- every counter/timing column below is summed
+    sum(gsb.checkpoints_req) as checkpoints_req,
+    sum(gsb.checkpoint_write_time) as checkpoint_write_time,
+    sum(gsb.checkpoint_sync_time) as checkpoint_sync_time,
+    sum(gsb.buffers_checkpoint) as buffers_checkpoint,
+    sum(gsb.buffers_clean) as buffers_clean,
+    sum(gsb.maxwritten_clean) as maxwritten_clean,
+    sum(gsb.buffers_backend) as buffers_backend,
+    sum(gsb.buffers_backend_fsync) as buffers_backend_fsync,
+    sum(gsb.buffers_alloc) as buffers_alloc,
+    max(gsb.stats_reset) as stats_reset  -- greatest (latest) reset timestamp among the rows
+FROM
+    gp_stat_bgwriter gsb;
+
+CREATE VIEW gp_stat_wal_summary AS  -- single-row rollup over every row of gp_stat_wal
+SELECT
+    sum(gsw.wal_records) as wal_records,  -- every WAL counter/timing column below is summed
+    sum(gsw.wal_fpw) as wal_fpw,
+    sum(gsw.wal_bytes) as wal_bytes,
+    sum(gsw.wal_buffers_full) as wal_buffers_full,
+    sum(gsw.wal_write) as wal_write,
+    sum(gsw.wal_sync) as wal_sync,
+    sum(gsw.wal_write_time) as wal_write_time,
+    sum(gsw.wal_sync_time) as wal_sync_time,
+    max(gsw.stats_reset) as stats_reset  -- greatest (latest) reset timestamp among the rows
+from
+    gp_stat_wal gsw;
+
+CREATE VIEW gp_stat_database_summary AS  -- one output row per (datid, datname), aggregated from gp_stat_database
+SELECT
+    sdb.datid,
+    sdb.datname,
+    sum(sdb.numbackends) as numbackends,
+    max(sdb.xact_commit) as xact_commit,  -- max, not sum. NOTE(review): presumably so one distributed transaction is not counted once per row - confirm
+    max(sdb.xact_rollback) as xact_rollback,  -- max, same treatment as xact_commit
+    sum(sdb.blks_read) as blks_read,  -- block and tuple counters are summed
+    sum(sdb.blks_hit) as blks_hit,
+    sum(sdb.tup_returned) as tup_returned,
+    sum(sdb.tup_fetched) as tup_fetched,
+    sum(sdb.tup_inserted) as tup_inserted,
+    sum(sdb.tup_updated) as tup_updated,
+    sum(sdb.tup_deleted) as tup_deleted,
+    max(sdb.conflicts) as conflicts,  -- max, not sum (unlike the neighbouring counters)
+    sum(sdb.temp_files) as temp_files,
+    sum(sdb.temp_bytes) as temp_bytes,
+    sum(sdb.deadlocks) as deadlocks,
+    sum(sdb.checksum_failures) as checksum_failures,
+    max(sdb.checksum_last_failure) as checksum_last_failure,  -- latest failure timestamp among the rows
+    sum(sdb.blk_read_time) as blk_read_time,
+    sum(sdb.blk_write_time) as blk_write_time,
+    max(sdb.stats_reset) as stats_reset  -- latest reset timestamp among the rows
+FROM
+    gp_stat_database sdb
+GROUP BY
+    sdb.datid,
+    sdb.datname;
+
+
+-- Gather data from segments on user tables (relid >= 16384), and use data on coordinator on system tables (relid < 16384).
+CREATE VIEW gp_stat_all_tables_summary AS
+SELECT
+    s.relid,
+    s.schemaname,
+    s.relname,
+    m.seq_scan,  -- scan and tuple counters come from the merged subquery m
+    m.seq_tup_read,
+    m.idx_scan,
+    m.idx_tup_fetch,
+    m.n_tup_ins,
+    m.n_tup_upd,
+    m.n_tup_del,
+    m.n_tup_hot_upd,
+    m.n_live_tup,
+    m.n_dead_tup,
+    m.n_mod_since_analyze,
+    s.last_vacuum,  -- vacuum/analyze timestamps and counts are read from the local pg_stat_all_tables (s), not from m
+    s.last_autovacuum,
+    s.last_analyze,
+    s.last_autoanalyze,
+    s.vacuum_count,
+    s.autovacuum_count,
+    s.analyze_count,
+    s.autoanalyze_count
+FROM
+    (SELECT  -- branch 1: per-relation aggregate of gp_dist_random('pg_stat_all_tables') for relid >= 16384
+         allt.relid,
+         allt.schemaname,
+         allt.relname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+         case when d.policytype = 'r' then (sum(seq_scan)/d.numsegments)::bigint else sum(seq_scan) end seq_scan,
+         case when d.policytype = 'r' then (sum(seq_tup_read)/d.numsegments)::bigint else sum(seq_tup_read) end seq_tup_read,
+         case when d.policytype = 'r' then (sum(idx_scan)/d.numsegments)::bigint else sum(idx_scan) end idx_scan,
+         case when d.policytype = 'r' then (sum(idx_tup_fetch)/d.numsegments)::bigint else sum(idx_tup_fetch) end idx_tup_fetch,
+         case when d.policytype = 'r' then (sum(n_tup_ins)/d.numsegments)::bigint else sum(n_tup_ins) end n_tup_ins,
+         case when d.policytype = 'r' then (sum(n_tup_upd)/d.numsegments)::bigint else sum(n_tup_upd) end n_tup_upd,
+         case when d.policytype = 'r' then (sum(n_tup_del)/d.numsegments)::bigint else sum(n_tup_del) end n_tup_del,
+         case when d.policytype = 'r' then (sum(n_tup_hot_upd)/d.numsegments)::bigint else sum(n_tup_hot_upd) end n_tup_hot_upd,
+         case when d.policytype = 'r' then (sum(n_live_tup)/d.numsegments)::bigint else sum(n_live_tup) end n_live_tup,
+         case when d.policytype = 'r' then (sum(n_dead_tup)/d.numsegments)::bigint else sum(n_dead_tup) end n_dead_tup,
+         case when d.policytype = 'r' then (sum(n_mod_since_analyze)/d.numsegments)::bigint else sum(n_mod_since_analyze) end n_mod_since_analyze,
+         max(last_vacuum) as last_vacuum,  -- these max() columns keep the branch union-compatible with SELECT * below
+         max(last_autovacuum) as last_autovacuum,
+         max(last_analyze) as last_analyze,
+         max(last_autoanalyze) as last_autoanalyze,
+         max(vacuum_count) as vacuum_count,
+         max(autovacuum_count) as autovacuum_count,
+         max(analyze_count) as analyze_count,
+         max(autoanalyze_count) as autoanalyze_count
+     FROM
+         gp_dist_random('pg_stat_all_tables') allt
+         inner join pg_class c
+               on allt.relid = c.oid
+         left outer join gp_distribution_policy d  -- left join: relations without a policy row survive with NULL policytype
+              on allt.relid = d.localoid
+     WHERE
+        relid >= 16384
+        and (
+            d.localoid is not null  -- keep relations that have a distribution policy ...
+            or c.relkind in ('o', 'b', 'M')  -- ... or these relkinds. NOTE(review): presumably append-optimized auxiliary relations - confirm
+            )
+     GROUP BY allt.relid, allt.schemaname, allt.relname, d.policytype, d.numsegments
+
+     UNION ALL
+
+     SELECT  -- branch 2: rows for relid < 16384 taken as-is from the local pg_stat_all_tables
+         *
+     FROM
+         pg_stat_all_tables
+     WHERE
+             relid < 16384) m, pg_stat_all_tables s
+WHERE m.relid = s.relid;
+
+CREATE VIEW gp_stat_user_tables_summary AS  -- rows of gp_stat_all_tables_summary outside the system schemas
+    SELECT * FROM gp_stat_all_tables_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_stat_sys_tables_summary filter
+          schemaname !~ '^pg_toast';
+
+CREATE VIEW gp_stat_sys_tables_summary AS  -- rows of gp_stat_all_tables_summary in the system schemas
+    SELECT * FROM gp_stat_all_tables_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_stat_xact_all_tables_summary AS  -- one row per relation, aggregated from gp_stat_xact_all_tables
+SELECT
+    sxa.relid,
+    sxa.schemaname,
+    sxa.relname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.seq_scan)/dst.numsegments)::bigint ELSE sum(sxa.seq_scan) END AS seq_scan,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.seq_tup_read)/dst.numsegments)::bigint ELSE sum(sxa.seq_tup_read) END AS seq_tup_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.idx_scan)/dst.numsegments)::bigint ELSE sum(sxa.idx_scan) END AS idx_scan,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.idx_tup_fetch)/dst.numsegments)::bigint ELSE sum(sxa.idx_tup_fetch) END AS idx_tup_fetch,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.n_tup_ins)/dst.numsegments)::bigint ELSE sum(sxa.n_tup_ins) END AS n_tup_ins,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.n_tup_upd)/dst.numsegments)::bigint ELSE sum(sxa.n_tup_upd) END AS n_tup_upd,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.n_tup_del)/dst.numsegments)::bigint ELSE sum(sxa.n_tup_del) END AS n_tup_del,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sxa.n_tup_hot_upd)/dst.numsegments)::bigint ELSE sum(sxa.n_tup_hot_upd) END AS n_tup_hot_upd
+FROM
+    gp_stat_xact_all_tables sxa
+    LEFT OUTER JOIN gp_distribution_policy dst  -- left join: relations without a policy row are kept with NULL policytype
+         ON sxa.relid = dst.localoid
+GROUP BY
+    sxa.relid,
+    sxa.schemaname,
+    sxa.relname,
+    dst.policytype,  -- grouped only because the CASE expressions reference them outside an aggregate
+    dst.numsegments;
+
+CREATE VIEW gp_stat_xact_sys_tables_summary as  -- rows of gp_stat_xact_all_tables_summary in the system schemas
+    SELECT * FROM gp_stat_xact_all_tables_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_stat_xact_user_tables_summary AS  -- rows of gp_stat_xact_all_tables_summary outside the system schemas
+    SELECT * FROM gp_stat_xact_all_tables_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_stat_xact_sys_tables_summary filter
+          schemaname !~ '^pg_toast';
+
+-- Gather data from segments on user tables (relid >= 16384), and use data on coordinator on system tables (relid < 16384).
+CREATE VIEW gp_stat_all_indexes_summary AS
+SELECT
+    s.relid,
+    s.indexrelid,
+    s.schemaname,
+    s.relname,
+    s.indexrelname,
+    m.idx_scan,  -- counters come from the merged subquery m, identity columns from the local pg_stat_all_indexes (s)
+    m.idx_tup_read,
+    m.idx_tup_fetch
+FROM
+    (SELECT  -- branch 1: per-index aggregate of gp_dist_random('pg_stat_all_indexes') for relid >= 16384
+         alli.relid,
+         alli.indexrelid,
+         alli.schemaname,
+         alli.relname,
+         alli.indexrelname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+         case when d.policytype = 'r' then (sum(alli.idx_scan)/d.numsegments)::bigint else sum(alli.idx_scan) end idx_scan,
+         case when d.policytype = 'r' then (sum(alli.idx_tup_read)/d.numsegments)::bigint else sum(alli.idx_tup_read) end idx_tup_read,
+         case when d.policytype = 'r' then (sum(alli.idx_tup_fetch)/d.numsegments)::bigint else sum(alli.idx_tup_fetch) end idx_tup_fetch
+     FROM
+         gp_dist_random('pg_stat_all_indexes') alli
+         inner join pg_class c
+               on alli.relid = c.oid
+         left outer join gp_distribution_policy d  -- left join: tables without a policy row are kept with NULL policytype
+              on alli.relid = d.localoid
+     WHERE
+        relid >= 16384
+     GROUP BY alli.relid, alli.indexrelid, alli.schemaname, alli.relname, alli.indexrelname, d.policytype, d.numsegments
+
+     UNION ALL
+
+     SELECT  -- branch 2: rows for relid < 16384 taken as-is from the local pg_stat_all_indexes
+         *
+     FROM
+         pg_stat_all_indexes
+     WHERE
+             relid < 16384) m, pg_stat_all_indexes s
+WHERE m.relid = s.relid AND m.indexrelid = s.indexrelid;
+
+CREATE VIEW gp_stat_sys_indexes_summary AS  -- rows of gp_stat_all_indexes_summary in the system schemas
+    SELECT * FROM gp_stat_all_indexes_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_stat_user_indexes_summary AS  -- rows of gp_stat_all_indexes_summary outside the system schemas
+    SELECT * FROM gp_stat_all_indexes_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_stat_sys_indexes_summary filter
+          schemaname !~ '^pg_toast';
+
+CREATE VIEW gp_statio_all_tables_summary as  -- one row per relation, aggregated from gp_statio_all_tables
+SELECT
+    sat.relid,
+    sat.schemaname,
+    sat.relname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.heap_blks_read)/dst.numsegments)::bigint ELSE sum(sat.heap_blks_read) END AS heap_blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.heap_blks_hit)/dst.numsegments)::bigint ELSE sum(sat.heap_blks_hit) END AS heap_blks_hit,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.idx_blks_read)/dst.numsegments)::bigint ELSE sum(sat.idx_blks_read) END AS idx_blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.idx_blks_hit)/dst.numsegments)::bigint ELSE sum(sat.idx_blks_hit) END AS idx_blks_hit,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.toast_blks_read)/dst.numsegments)::bigint ELSE sum(sat.toast_blks_read) END AS toast_blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.toast_blks_hit)/dst.numsegments)::bigint ELSE sum(sat.toast_blks_hit) END AS toast_blks_hit,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.tidx_blks_read)/dst.numsegments)::bigint ELSE sum(sat.tidx_blks_read) END AS tidx_blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sat.tidx_blks_hit)/dst.numsegments)::bigint ELSE sum(sat.tidx_blks_hit) END AS tidx_blks_hit
+FROM
+    gp_statio_all_tables sat
+    LEFT OUTER JOIN gp_distribution_policy dst  -- left join: relations without a policy row are kept with NULL policytype
+         ON sat.relid = dst.localoid
+GROUP BY
+    sat.relid,
+    sat.schemaname,
+    sat.relname,
+    dst.policytype,  -- grouped only because the CASE expressions reference them outside an aggregate
+    dst.numsegments;
+
+CREATE VIEW gp_statio_sys_tables_summary AS  -- rows of gp_statio_all_tables_summary in the system schemas
+    SELECT * FROM gp_statio_all_tables_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_statio_user_tables_summary AS  -- rows of gp_statio_all_tables_summary outside the system schemas
+    SELECT * FROM gp_statio_all_tables_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_statio_sys_tables_summary filter
+          schemaname !~ '^pg_toast';
+
+CREATE VIEW gp_statio_all_sequences_summary as  -- one row per sequence, aggregated from gp_statio_all_sequences
+SELECT
+    sas.relid,
+    sas.schemaname,
+    sas.relname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    CASE WHEN dst.policytype = 'r' THEN (sum(sas.blks_read)/dst.numsegments)::bigint ELSE sum(sas.blks_read) END AS blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sas.blks_hit)/dst.numsegments)::bigint ELSE sum(sas.blks_hit) END AS blks_hit
+FROM
+    gp_statio_all_sequences sas
+    LEFT OUTER JOIN gp_distribution_policy dst  -- left join: sequences without a policy row are kept with NULL policytype
+         ON sas.relid = dst.localoid
+GROUP BY
+    sas.relid,
+    sas.schemaname,
+    sas.relname,
+    dst.policytype,  -- grouped only because the CASE expressions reference them outside an aggregate
+    dst.numsegments;
+
+CREATE VIEW gp_statio_sys_sequences_summary AS  -- rows of gp_statio_all_sequences_summary in the system schemas
+    SELECT * FROM gp_statio_all_sequences_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_statio_user_sequences_summary AS  -- rows of gp_statio_all_sequences_summary outside the system schemas
+    SELECT * FROM gp_statio_all_sequences_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_statio_sys_sequences_summary filter
+          schemaname !~ '^pg_toast';
+
+CREATE VIEW gp_statio_all_indexes_summary AS  -- one row per index, aggregated from gp_statio_all_indexes
+SELECT
+    sai.relid,
+    sai.indexrelid,
+    sai.schemaname,
+    sai.relname,
+    sai.indexrelname,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    CASE WHEN dst.policytype = 'r' THEN (sum(sai.idx_blks_read)/dst.numsegments)::bigint ELSE sum(sai.idx_blks_read) END AS idx_blks_read,
+    CASE WHEN dst.policytype = 'r' THEN (sum(sai.idx_blks_hit)/dst.numsegments)::bigint ELSE sum(sai.idx_blks_hit) END AS idx_blks_hit
+FROM
+    gp_statio_all_indexes sai
+    LEFT OUTER JOIN gp_distribution_policy dst  -- policy is looked up through the table (relid), not the index
+         ON sai.relid = dst.localoid
+GROUP BY
+    sai.relid,
+    sai.indexrelid,
+    sai.schemaname,
+    sai.relname,
+    sai.indexrelname,
+    dst.policytype,  -- grouped only because the CASE expressions reference them outside an aggregate
+    dst.numsegments;
+
+CREATE VIEW gp_statio_sys_indexes_summary AS  -- rows of gp_statio_all_indexes_summary in the system schemas
+    SELECT * FROM gp_statio_all_indexes_summary
+    WHERE schemaname IN ('pg_catalog', 'information_schema', 'pg_aoseg') OR  -- listed schemas, or any schema whose name starts with pg_toast
+          schemaname ~ '^pg_toast';
+
+CREATE VIEW gp_statio_user_indexes_summary AS  -- rows of gp_statio_all_indexes_summary outside the system schemas
+    SELECT * FROM gp_statio_all_indexes_summary
+    WHERE schemaname NOT IN ('pg_catalog', 'information_schema', 'pg_aoseg') AND  -- exact complement of the gp_statio_sys_indexes_summary filter
+          schemaname !~ '^pg_toast';
+
+CREATE VIEW gp_stat_user_functions_summary AS  -- one row per function, aggregated from gp_stat_user_functions
+SELECT
+    guf.funcid,
+    guf.schemaname,
+    guf.funcname,
+    sum(guf.calls) AS calls,  -- call count and both timing columns are plain sums over the grouped rows
+    sum(guf.total_time) AS total_time,
+    sum(guf.self_time) AS self_time
+FROM
+    gp_stat_user_functions guf
+GROUP BY
+    guf.funcid,
+    guf.schemaname,
+    guf.funcname;
+
+CREATE VIEW gp_stat_xact_user_functions_summary AS  -- one row per function, aggregated from gp_stat_xact_user_functions
+SELECT
+    xuf.funcid,
+    xuf.schemaname,
+    xuf.funcname,
+    sum(xuf.calls) AS calls,  -- call count and both timing columns are plain sums over the grouped rows
+    sum(xuf.total_time) AS total_time,
+    sum(xuf.self_time) AS self_time
+FROM
+    gp_stat_xact_user_functions xuf
+GROUP BY
+    xuf.funcid,
+    xuf.schemaname,
+    xuf.funcname;
+
+CREATE VIEW gp_stat_slru_summary AS  -- one row per SLRU name, aggregated from gp_stat_slru
+SELECT
+    gss.name,
+    sum(gss.blks_zeroed) AS blks_zeroed,  -- every counter below is summed over the rows sharing this name
+    sum(gss.blks_hit) AS blks_hit,
+    sum(gss.blks_read) AS blks_read,
+    sum(gss.blks_written) AS blks_written,
+    sum(gss.blks_exists) AS blks_exists,
+    sum(gss.flushes) AS flushes,
+    sum(gss.truncates) AS truncates,
+    max(gss.stats_reset) AS stats_reset  -- greatest (latest) reset timestamp among the rows
+FROM
+    gp_stat_slru gss
+GROUP BY
+    gss.name;
+
+
+CREATE VIEW gp_stat_progress_vacuum_summary AS  -- per (database, relation, phase) rollup of gp_stat_progress_vacuum rows with gp_segment_id > -1
+SELECT
+    max(coalesce(a1.pid, 0)) as pid,  -- pid of the matching gp_segment_id = -1 row, or 0 when the left join finds none
+    a.datid,
+    a.datname,
+    a.relid,
+    a.phase,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    case when d.policytype = 'r' then (sum(a.heap_blks_total)/d.numsegments)::bigint else sum(a.heap_blks_total) end heap_blks_total,
+    case when d.policytype = 'r' then (sum(a.heap_blks_scanned)/d.numsegments)::bigint else sum(a.heap_blks_scanned) end heap_blks_scanned,
+    case when d.policytype = 'r' then (sum(a.heap_blks_vacuumed)/d.numsegments)::bigint else sum(a.heap_blks_vacuumed) end heap_blks_vacuumed,
+    case when d.policytype = 'r' then (sum(a.index_vacuum_count)/d.numsegments)::bigint else sum(a.index_vacuum_count) end index_vacuum_count,
+    case when d.policytype = 'r' then (sum(a.max_dead_tuples)/d.numsegments)::bigint else sum(a.max_dead_tuples) end max_dead_tuples,
+    case when d.policytype = 'r' then (sum(a.num_dead_tuples)/d.numsegments)::bigint else sum(a.num_dead_tuples) end num_dead_tuples
+FROM gp_stat_progress_vacuum a
+    JOIN pg_class c ON a.relid = c.oid  -- inner join: progress rows whose relid is not in pg_class are dropped
+    LEFT JOIN gp_distribution_policy d ON c.oid = d.localoid
+    LEFT JOIN gp_stat_progress_vacuum a1 ON a.pid = a1.pid AND a1.gp_segment_id = -1  -- NOTE(review): matches on equal pid across rows - confirm pids are comparable between them
+WHERE a.gp_segment_id > -1  -- NOTE(review): -1 is presumably the coordinator row - confirm
+GROUP BY a.datid, a.datname, a.relid, a.phase, d.policytype, d.numsegments;
+
+CREATE OR REPLACE VIEW gp_stat_progress_analyze_summary AS  -- per (database, relation, phase) rollup of gp_stat_progress_analyze rows with gp_segment_id > -1
+SELECT
+    max(coalesce(a1.pid, 0)) as pid,  -- pid of the matching gp_segment_id = -1 row, or 0 when the left join finds none
+    a.datid,
+    a.datname,
+    a.relid,
+    a.phase,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    case when d.policytype = 'r' then (sum(a.sample_blks_total)/d.numsegments)::bigint else sum(a.sample_blks_total) end sample_blks_total,
+    case when d.policytype = 'r' then (sum(a.sample_blks_scanned)/d.numsegments)::bigint else sum(a.sample_blks_scanned) end sample_blks_scanned,
+    case when d.policytype = 'r' then (sum(a.ext_stats_total)/d.numsegments)::bigint else sum(a.ext_stats_total) end ext_stats_total,
+    case when d.policytype = 'r' then (sum(a.ext_stats_computed)/d.numsegments)::bigint else sum(a.ext_stats_computed) end ext_stats_computed,
+    case when d.policytype = 'r' then (sum(a.child_tables_total)/d.numsegments)::bigint else sum(a.child_tables_total) end child_tables_total,
+    case when d.policytype = 'r' then (sum(a.child_tables_done)/d.numsegments)::bigint else sum(a.child_tables_done) end child_tables_done
+FROM gp_stat_progress_analyze a
+    JOIN pg_class c ON a.relid = c.oid  -- inner join: progress rows whose relid is not in pg_class are dropped
+    LEFT JOIN gp_distribution_policy d ON c.oid = d.localoid
+    LEFT JOIN gp_stat_progress_analyze a1 ON a.pid = a1.pid AND a1.gp_segment_id = -1  -- NOTE(review): matches on equal pid across rows - confirm pids are comparable between them
+WHERE a.gp_segment_id > -1  -- NOTE(review): -1 is presumably the coordinator row - confirm
+GROUP BY a.datid, a.datname, a.relid, a.phase, d.policytype, d.numsegments;
+
+CREATE OR REPLACE VIEW gp_stat_progress_cluster_summary AS  -- rollup of gp_stat_progress_cluster rows with gp_segment_id > -1, grouped by the plain columns below
+SELECT
+    max(coalesce(a1.pid, 0)) as pid,  -- pid of the matching gp_segment_id = -1 row, or 0 when the left join finds none
+    a.datid,
+    a.datname,
+    a.relid,
+    a.command,
+    a.phase,
+    a.cluster_index_relid,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    case when d.policytype = 'r' then (sum(a.heap_tuples_scanned)/d.numsegments)::bigint else sum(a.heap_tuples_scanned) end heap_tuples_scanned,
+    case when d.policytype = 'r' then (sum(a.heap_tuples_written)/d.numsegments)::bigint else sum(a.heap_tuples_written) end heap_tuples_written,
+    case when d.policytype = 'r' then (sum(a.heap_blks_total)/d.numsegments)::bigint else sum(a.heap_blks_total) end heap_blks_total,
+    case when d.policytype = 'r' then (sum(a.heap_blks_scanned)/d.numsegments)::bigint else sum(a.heap_blks_scanned) end heap_blks_scanned,
+    case when d.policytype = 'r' then (sum(a.index_rebuild_count)/d.numsegments)::bigint else sum(a.index_rebuild_count) end index_rebuild_count
+FROM gp_stat_progress_cluster a
+    JOIN pg_class c ON a.relid = c.oid  -- inner join: progress rows whose relid is not in pg_class are dropped
+    LEFT JOIN gp_distribution_policy d ON c.oid = d.localoid
+    LEFT JOIN gp_stat_progress_cluster a1 ON a.pid = a1.pid AND a1.gp_segment_id = -1  -- NOTE(review): matches on equal pid across rows - confirm pids are comparable between them
+WHERE a.gp_segment_id > -1  -- NOTE(review): -1 is presumably the coordinator row - confirm
+GROUP BY a.datid, a.datname, a.relid, a.command, a.phase, a.cluster_index_relid, d.policytype, d.numsegments;
+
+CREATE OR REPLACE VIEW gp_stat_progress_create_index_summary AS  -- rollup of gp_stat_progress_create_index rows with gp_segment_id > -1, grouped by the plain columns below
+SELECT
+    max(coalesce(a1.pid, 0)) as pid,  -- pid of the matching gp_segment_id = -1 row, or 0 when the left join finds none
+    a.datid,
+    a.datname,
+    a.relid,
+    a.index_relid,
+    a.command,
+    a.phase,  -- below: policytype 'r' divides the sum by numsegments, any other (or NULL) policytype keeps the plain sum
+    case when d.policytype = 'r' then (sum(a.lockers_total)/d.numsegments)::bigint else sum(a.lockers_total) end lockers_total,
+    case when d.policytype = 'r' then (sum(a.lockers_done)/d.numsegments)::bigint else sum(a.lockers_done) end lockers_done,
+    max(a.current_locker_pid) as current_locker_pid,  -- a pid is not additive, so the greatest value in the group is reported
+    case when d.policytype = 'r' then (sum(a.blocks_total)/d.numsegments)::bigint else sum(a.blocks_total) end blocks_total,
+    case when d.policytype = 'r' then (sum(a.blocks_done)/d.numsegments)::bigint else sum(a.blocks_done) end blocks_done,
+    case when d.policytype = 'r' then (sum(a.tuples_total)/d.numsegments)::bigint else sum(a.tuples_total) end tuples_total,
+    case when d.policytype = 'r' then (sum(a.tuples_done)/d.numsegments)::bigint else sum(a.tuples_done) end tuples_done,
+    case when d.policytype = 'r' then (sum(a.partitions_total)/d.numsegments)::bigint else sum(a.partitions_total) end partitions_total,
+    case when d.policytype = 'r' then (sum(a.partitions_done)/d.numsegments)::bigint else sum(a.partitions_done) end partitions_done
+FROM gp_stat_progress_create_index a
+    JOIN pg_class c ON a.relid = c.oid  -- inner join: progress rows whose relid is not in pg_class are dropped
+    LEFT JOIN gp_distribution_policy d ON c.oid = d.localoid
+    LEFT JOIN gp_stat_progress_create_index a1 ON a.pid = a1.pid AND a1.gp_segment_id = -1  -- NOTE(review): matches on equal pid across rows - confirm pids are comparable between them
+WHERE a.gp_segment_id > -1  -- NOTE(review): -1 is presumably the coordinator row - confirm
+GROUP BY a.datid, a.datname, a.relid, a.index_relid, a.command, a.phase, d.policytype, d.numsegments;
diff --git a/src/backend/cdb/cdbpath.c b/src/backend/cdb/cdbpath.c
index 9e3697a3b03..e9d7dac9895 100644
--- a/src/backend/cdb/cdbpath.c
+++ b/src/backend/cdb/cdbpath.c
@@ -3112,8 +3112,9 @@ cdbpath_motion_for_parallel_join(PlannerInfo *root,
 		case JOIN_UNIQUE_INNER:
 		case JOIN_RIGHT:
 		case JOIN_FULL:
-			/* Join types are not supported in parallel yet. */
-			goto fail;
+			outer.ok_to_replicate = false;
+			inner.ok_to_replicate = false;
+			break;
 		case JOIN_DEDUP_SEMI:
 			if (!enable_parallel_dedup_semi_join)
 				goto fail;
diff --git a/src/backend/cdb/cdbpathlocus.c b/src/backend/cdb/cdbpathlocus.c
index 29930085429..dddae1aa64c 100644
--- a/src/backend/cdb/cdbpathlocus.c
+++ b/src/backend/cdb/cdbpathlocus.c
@@ -119,6 +119,11 @@ cdbpathlocus_equal(CdbPathLocus a, CdbPathLocus b)
 		list_length(a.distkey) != list_length(b.distkey))
 		return false;
 
+	/*
+	 * CBDB_PARALLEL: What if both a and b are HashedOJ with parallel workers > 0 ?
+	 * Are they equal in practice?
+	 */
+
 	if ((CdbPathLocus_IsHashed(a) || CdbPathLocus_IsHashedOJ(a)) &&
 		(CdbPathLocus_IsHashed(b) || CdbPathLocus_IsHashedOJ(b)))
 		return cdbpath_distkey_equal(a.distkey, b.distkey);
@@ -544,7 +549,7 @@ cdbpathlocus_from_subquery(struct PlannerInfo *root,
 		else
 		{
 			Assert(CdbPathLocus_IsHashedOJ(subpath->locus));
-			CdbPathLocus_MakeHashedOJ(&locus, distkeys, numsegments);
+			CdbPathLocus_MakeHashedOJ(&locus, distkeys, numsegments, subpath->locus.parallel_workers);
 		}
 	}
 	else
@@ -711,7 +716,7 @@ cdbpathlocus_pull_above_projection(struct PlannerInfo *root,
 			CdbPathLocus_MakeHashedWorkers(&newlocus, newdistkeys, numsegments, locus.parallel_workers);
 		}
 		else
-			CdbPathLocus_MakeHashedOJ(&newlocus, newdistkeys, numsegments);
+			CdbPathLocus_MakeHashedOJ(&newlocus, newdistkeys, numsegments, locus.parallel_workers);
 		return newlocus;
 	}
 	else
@@ -880,7 +885,7 @@ cdbpathlocus_join(JoinType jointype, CdbPathLocus a, CdbPathLocus b)
 
 			newdistkeys = lappend(newdistkeys, newdistkey);
 		}
-		CdbPathLocus_MakeHashedOJ(&resultlocus, newdistkeys, numsegments);
+		CdbPathLocus_MakeHashedOJ(&resultlocus, newdistkeys, numsegments, 0 /* Both are 0 parallel here*/);
 	}
 	Assert(cdbpathlocus_is_valid(resultlocus));
 	return resultlocus;
@@ -1236,8 +1241,14 @@ cdbpathlocus_parallel_join(JoinType jointype, CdbPathLocus a, CdbPathLocus b, bo
 	Assert(cdbpathlocus_is_valid(a));
 	Assert(cdbpathlocus_is_valid(b));
 
-	/* Do both input rels have same locus? */
-	if (cdbpathlocus_equal(a, b))
+	/*
+	 * Do both input rels have same locus?
+	 * CBDB_PARALLEL: for FULL JOIN, the join locus could be different even
+	 * if both have the same locus, because the NULL values could be on any
+	 * segment after the join.
+	 */
+
+	if (jointype != JOIN_FULL && cdbpathlocus_equal(a, b))
 		return a;
 
 	/*
@@ -1412,8 +1423,9 @@ cdbpathlocus_parallel_join(JoinType jointype, CdbPathLocus a, CdbPathLocus b, bo
 	 * If inner is hashed workers, and outer is hashed. Join locus will be hashed.
 	 * If outer is hashed workers, and inner is hashed. Join locus will be hashed workers.
 	 * Seems we should just return outer locus anyway.
+	 * Things changed since we have parallel full join now.
 	 */
-	if (parallel_aware)
+	if (parallel_aware && jointype != JOIN_FULL)
 		return a;
 
 	numsegments = CdbPathLocus_NumSegments(a);
@@ -1469,7 +1481,9 @@ cdbpathlocus_parallel_join(JoinType jointype, CdbPathLocus a, CdbPathLocus b, bo
 			newdistkeys = lappend(newdistkeys, newdistkey);
 		}
 
-		CdbPathLocus_MakeHashedOJ(&resultlocus, newdistkeys, numsegments);
+		Assert(CdbPathLocus_NumParallelWorkers(a) == CdbPathLocus_NumParallelWorkers(b));
+
+		CdbPathLocus_MakeHashedOJ(&resultlocus, newdistkeys, numsegments, CdbPathLocus_NumParallelWorkers(a));
 	}
 	Assert(cdbpathlocus_is_valid(resultlocus));
 	return resultlocus;
diff --git a/src/backend/cdb/cdbutil.c b/src/backend/cdb/cdbutil.c
index fbf3f8900f2..2503049b434 100644
--- a/src/backend/cdb/cdbutil.c
+++ b/src/backend/cdb/cdbutil.c
@@ -593,8 +593,13 @@ getCdbComponentInfo(void)
 			continue;
 
 		hsEntry = (HostPrimaryCountEntry *) hash_search(hostPrimaryCountHash, cdbInfo->config->hostname, HASH_FIND, &found);
-		Assert(found);
-		cdbInfo->hostPrimaryCount = hsEntry->segmentCount;
+		Assert(found || IS_HOT_STANDBY_QD());
+		/*
+		 * Standby and mirror entries can legitimately live on hosts that do not
+		 * own any primary segments. In that case the lookup is absent and the
+		 * count should be treated as zero instead of dereferencing a NULL entry.
+		 */
+		cdbInfo->hostPrimaryCount = found ? hsEntry->segmentCount : 0;
 	}
 
 	for (i = 0; i < component_databases->total_entry_dbs; i++)
@@ -605,8 +610,13 @@ getCdbComponentInfo(void)
 			continue;
 
 		hsEntry = (HostPrimaryCountEntry *) hash_search(hostPrimaryCountHash, cdbInfo->config->hostname, HASH_FIND, &found);
-		Assert(found);
-		cdbInfo->hostPrimaryCount = hsEntry->segmentCount;
+		Assert(found || IS_HOT_STANDBY_QD());
+		/*
+		 * Standby and mirror entries can legitimately live on hosts that do not
+		 * own any primary segments. In that case the lookup is absent and the
+		 * count should be treated as zero instead of dereferencing a NULL entry.
+		 */
+		cdbInfo->hostPrimaryCount = found ? hsEntry->segmentCount : 0;
 	}
 
 	hash_destroy(hostPrimaryCountHash);
diff --git a/src/backend/cdb/motion/cdbmotion.c b/src/backend/cdb/motion/cdbmotion.c
index 24b112cd1bd..ad3b1c49a65 100644
--- a/src/backend/cdb/motion/cdbmotion.c
+++ b/src/backend/cdb/motion/cdbmotion.c
@@ -133,8 +133,8 @@ RemoveMotionLayer(MotionLayerState *mlStates)
 	/* Emit statistics to log */
 	if (gp_log_interconnect >= GPVARS_VERBOSITY_VERBOSE)
 		elog(LOG, "RemoveMotionLayer(): dumping stats\n"
-			 "      Sent: %9u chunks %9u total bytes %9u tuple bytes\n"
-			 "  Received: %9u chunks %9u total bytes %9u tuple bytes; "
+			 "      Sent: %9" INT64_MODIFIER "u chunks %9" INT64_MODIFIER "u total bytes %9" INT64_MODIFIER "u tuple bytes\n"
+			 "  Received: %9" INT64_MODIFIER "u chunks %9" INT64_MODIFIER "u total bytes %9" INT64_MODIFIER "u tuple bytes; "
 			 "%9u chunkproc calls\n",
 			 mlStates->stat_total_chunks_sent,
 			 mlStates->stat_total_bytes_sent,
diff --git a/src/backend/commands/analyze.c b/src/backend/commands/analyze.c
index 8d329d44503..6f8b5e3d0ec 100644
--- a/src/backend/commands/analyze.c
+++ b/src/backend/commands/analyze.c
@@ -884,7 +884,7 @@ do_analyze_rel(Relation onerel, VacuumParams *params,
 
 			if (Gp_role == GP_ROLE_DISPATCH && GpPolicyIsPartitioned(onerel->rd_cdbpolicy))
 			{
-				stats->stadistinctbyseg = colNDVBySeg[i];
+				stats->stadistinctbyseg = colNDVBySeg[stats->attr->attnum - 1];
 			}
 
 			stats->tupDesc = onerel->rd_att;
@@ -1008,7 +1008,7 @@ do_analyze_rel(Relation onerel, VacuumParams *params,
 
 			if (Gp_role == GP_ROLE_EXECUTE) {
 				Assert(ctx->stadistincts);
-				ctx->stadistincts[i] = Float8GetDatum(stats->stadistinct);
+				ctx->stadistincts[stats->attr->attnum - 1] = Float8GetDatum(stats->stadistinct);
 			}
 
 			MemoryContextResetAndDeleteChildren(col_context);
@@ -1896,6 +1896,7 @@ acquire_sample_rows(Relation onerel, int elevel,
 
 		pgstat_progress_update_param(PROGRESS_ANALYZE_BLOCKS_DONE,
 									 ++blksdone);
+		SIMPLE_FAULT_INJECTOR("analyze_block");
 	}
 
 	ExecDropSingleTupleTableSlot(slot);
diff --git a/src/backend/commands/copy.c b/src/backend/commands/copy.c
index c9d2ac4f968..4ccd3798067 100644
--- a/src/backend/commands/copy.c
+++ b/src/backend/commands/copy.c
@@ -58,7 +58,6 @@
 #include "catalog/catalog.h"
 #include "catalog/gp_matview_aux.h"
 #include "catalog/namespace.h"
-#include "catalog/pg_inherits.h"
 #include "catalog/pg_extprotocol.h"
 #include "cdb/cdbappendonlyam.h"
 #include "cdb/cdbaocsam.h"
@@ -137,37 +136,6 @@ DoCopy(ParseState *pstate, const CopyStmt *stmt,
 	{
 		/* Open and lock the relation, using the appropriate lock type. */
 		rel = table_openrv(stmt->relation, lockmode);
-
-		/*
-		 * For COPY TO, refresh the active snapshot after acquiring the lock.
-		 *
-		 * The snapshot was originally pushed by PortalRunUtility() before
-		 * DoCopy() was called, which means it was taken before we acquired
-		 * the lock on the relation. If we had to wait for a conflicting lock
-		 * (e.g., AccessExclusiveLock held by a concurrent ALTER TABLE ...
-		 * SET WITH (reorganize=true)), the snapshot may predate the
-		 * concurrent transaction's commit. After the lock is granted, scanning
-		 * with such a stale snapshot would miss all tuples written by the
-		 * concurrent transaction, resulting in COPY returning zero rows.
-		 *
-		 * This mirrors the approach used by exec_simple_query() for SELECT
-		 * statements, which pops the parse/analyze snapshot and takes a fresh
-		 * one in PortalStart() after locks have been acquired (see the comment
-		 * at postgres.c:1859-1867). It is also consistent with how VACUUM and
-		 * CLUSTER manage their own snapshots internally.
-		 *
-		 * In REPEATABLE READ or SERIALIZABLE mode, GetTransactionSnapshot()
-		 * returns the same transaction-level snapshot regardless, making this
-		 * a harmless no-op.
-		 *
-		 * We only do this for COPY TO (!is_from) because COPY FROM inserts
-		 * data and does not scan existing tuples with a snapshot.
-		 */
-		if (!is_from && ActiveSnapshotSet())
-		{
-			PopActiveSnapshot();
-			PushActiveSnapshot(GetTransactionSnapshot());
-		}
 	}
 	
 	/*
@@ -304,55 +272,6 @@ DoCopy(ParseState *pstate, const CopyStmt *stmt,
 						 errmsg("COPY FROM not supported with row-level security"),
 						 errhint("Use INSERT statements instead.")));
 
-			/*
-			 * For partitioned table COPY TO: eagerly acquire AccessShareLock
-			 * on all child partitions before refreshing the snapshot.
-			 *
-			 * When COPY is performed on a partitioned table, the parent
-			 * relation's AccessShareLock is acquired above (via table_openrv)
-			 * and Method A already refreshed the snapshot.  However, the
-			 * parent's AccessShareLock does NOT conflict with an
-			 * AccessExclusiveLock held on a child partition by a concurrent
-			 * reorganize.  As a result, Method A's snapshot may still predate
-			 * the child's reorganize commit.
-			 *
-			 * Child partition locks are acquired later, deep inside
-			 * ExecutorStart() via ExecInitAppend(), by which time the snapshot
-			 * has already been embedded in the QueryDesc via
-			 * PushCopiedSnapshot() in BeginCopy().  Even a second snapshot
-			 * refresh in BeginCopy() (after AcquireRewriteLocks) would not
-			 * help, because AcquireRewriteLocks only locks the parent (child
-			 * partitions are not in the initial range table of
-			 * "SELECT * FROM parent").
-			 *
-			 * The fix: call find_all_inheritors() with AccessShareLock to
-			 * acquire locks on every child partition NOW, before building the
-			 * query.  If a child partition's reorganize holds
-			 * AccessExclusiveLock, this call blocks until that transaction
-			 * commits.  Once it returns, all child-level reorganize operations
-			 * have committed, and a fresh snapshot taken here will see all
-			 * reorganized child data.
-			 *
-			 * find_all_inheritors() acquires locks that persist to end of
-			 * transaction.  The executor will re-acquire them during scan
-			 * initialization, which is a lock-manager no-op.
-			 */
-			if (!is_from && rel->rd_rel->relkind == RELKIND_PARTITIONED_TABLE)
-			{
-				List	   *part_oids;
-
-				part_oids = find_all_inheritors(RelationGetRelid(rel),
-												AccessShareLock, NULL);
-				list_free(part_oids);
-
-				/* Refresh snapshot: all child partition locks now held */
-				if (ActiveSnapshotSet())
-				{
-					PopActiveSnapshot();
-					PushActiveSnapshot(GetTransactionSnapshot());
-				}
-			}
-
 			/*
 			 * Build target list
 			 *
diff --git a/src/backend/commands/copyto.c b/src/backend/commands/copyto.c
index 88e61305250..871a973235e 100644
--- a/src/backend/commands/copyto.c
+++ b/src/backend/commands/copyto.c
@@ -1198,43 +1198,6 @@ BeginCopy(ParseState *pstate,
 
 		Assert(query->utilityStmt == NULL);
 
-		/*
-		 * Refresh the active snapshot after pg_analyze_and_rewrite() has
-		 * acquired all necessary relation locks via AcquireRewriteLocks().
-		 *
-		 * The snapshot in use was pushed by PortalRunUtility() before DoCopy()
-		 * was called -- before any table locks were acquired.  If
-		 * AcquireRewriteLocks() had to wait for a conflicting
-		 * AccessExclusiveLock (e.g., held by a concurrent ALTER TABLE ...
-		 * SET WITH (reorganize=true)), the lock wait is now over and the
-		 * reorganize transaction has committed.  The snapshot taken before the
-		 * wait does not reflect that commit: after reorganize completes,
-		 * swap_relation_files() has replaced the physical storage, so old
-		 * tuples no longer exist and the new tuples have xmin = reorganize_xid
-		 * which is not yet visible in the pre-wait snapshot.  Scanning with
-		 * the stale snapshot returns 0 rows -- a violation of transaction
-		 * atomicity (the reader must see either all old rows or all new rows).
-		 *
-		 * By refreshing the snapshot here -- after all locks are acquired --
-		 * we guarantee that the query will see the committed post-reorganize
-		 * data.
-		 *
-		 * This applies to:
-		 *   - Pure query-based COPY TO: COPY (SELECT ...) TO
-		 *   - RLS table COPY TO: converted to query-based in DoCopy(); the
-		 *     RLS policy references an external lookup table whose lock is
-		 *     acquired by AcquireRewriteLocks().
-		 *
-		 * In REPEATABLE READ or SERIALIZABLE isolation,
-		 * GetTransactionSnapshot() returns the same transaction-level
-		 * snapshot, making this a harmless no-op.
-		 */
-		if (ActiveSnapshotSet())
-		{
-			PopActiveSnapshot();
-			PushActiveSnapshot(GetTransactionSnapshot());
-		}
-
 		/*
 		 * Similarly the grammar doesn't enforce the presence of a RETURNING
 		 * clause, but this is required here.
diff --git a/src/backend/commands/createas.c b/src/backend/commands/createas.c
index 6822032fe0d..a3d2f155fd8 100644
--- a/src/backend/commands/createas.c
+++ b/src/backend/commands/createas.c
@@ -478,10 +478,6 @@ ExecCreateTableAs(ParseState *pstate, CreateTableAsStmt *stmt,
 									dest, params, queryEnv, 0);
 	}
 
-	/* GPDB hook for collecting query info */
-	if (query_info_collect_hook)
-		(*query_info_collect_hook)(METRICS_QUERY_SUBMIT, queryDesc);
-
 	if (into->skipData)
 	{
 		/*
@@ -495,6 +491,10 @@ ExecCreateTableAs(ParseState *pstate, CreateTableAsStmt *stmt,
 	}
 	else
 	{
+		/* GPDB hook for collecting query info */
+		if (query_info_collect_hook)
+			(*query_info_collect_hook)(METRICS_QUERY_SUBMIT, queryDesc);
+
 		check_and_unassign_from_resgroup(queryDesc->plannedstmt);
 		queryDesc->plannedstmt->query_mem = ResourceManagerGetQueryMemoryLimit(queryDesc->plannedstmt);
 
diff --git a/src/backend/commands/matview.c b/src/backend/commands/matview.c
index 1555ea9d334..dc8efd4d892 100644
--- a/src/backend/commands/matview.c
+++ b/src/backend/commands/matview.c
@@ -63,6 +63,7 @@
 #include "tcop/tcopprot.h"
 #include "utils/builtins.h"
 #include "utils/lsyscache.h"
+#include "utils/metrics_utils.h"
 #include "utils/rel.h"
 #include "utils/snapmgr.h"
 #include "utils/syscache.h"
@@ -842,6 +843,10 @@ refresh_matview_datafill(DestReceiver *dest, Query *query,
 								GetActiveSnapshot(), InvalidSnapshot,
 								dest, NULL, NULL, 0);
 
+	/* GPDB hook for collecting query info */
+	if (query_info_collect_hook)
+		(*query_info_collect_hook)(METRICS_QUERY_SUBMIT, queryDesc);
+
 	RestoreOidAssignments(saved_dispatch_oids);
 
 	/* call ExecutorStart to prepare the plan for execution */
diff --git a/src/backend/commands/portalcmds.c b/src/backend/commands/portalcmds.c
index 4817c14f07d..e23dc1d9c43 100644
--- a/src/backend/commands/portalcmds.c
+++ b/src/backend/commands/portalcmds.c
@@ -35,6 +35,7 @@
 #include "tcop/pquery.h"
 #include "tcop/tcopprot.h"
 #include "utils/memutils.h"
+#include "utils/metrics_utils.h"
 #include "utils/snapmgr.h"
 
 #include "cdb/cdbendpoint.h"
@@ -374,6 +375,22 @@ PortalCleanup(Portal portal)
 
 			CurrentResourceOwner = saveResourceOwner;
 		}
+		else
+		{
+			/* GPDB hook for collecting query info */
+			if (queryDesc->gpsc_query_key && query_info_collect_hook)
+			{
+				PG_TRY();
+				{
+					(*query_info_collect_hook)(METRICS_QUERY_ERROR, queryDesc);
+				}
+				PG_CATCH();
+				{
+					FlushErrorState();
+				}
+				PG_END_TRY();
+			}
+		}
 	}
 
 	/* 
diff --git a/src/backend/commands/tablecmds.c b/src/backend/commands/tablecmds.c
index 34c910565a9..76e939cf54d 100644
--- a/src/backend/commands/tablecmds.c
+++ b/src/backend/commands/tablecmds.c
@@ -1183,7 +1183,7 @@ DefineRelation(CreateStmt *stmt, char relkind, Oid ownerId,
 		 * table access method. The partition table will have the same behaviors on
 		 * relam, reloptions, attribute encodings in the future.
 		 */
-		stmt->attr_encodings = transfromColumnEncodingAocoRootPartition(schema,
+		stmt->attr_encodings = transformColumnEncodingAocoRootPartition(schema,
 								stmt->attr_encodings,
 								stmt->options,
 								!AMHandlerIsAoCols(amHandlerOid)
diff --git a/src/backend/commands/tablespace.c b/src/backend/commands/tablespace.c
index 2416522d016..e6822521694 100644
--- a/src/backend/commands/tablespace.c
+++ b/src/backend/commands/tablespace.c
@@ -328,7 +328,7 @@ CreateTableSpace(CreateTableSpaceStmt *stmt)
 	}
 
 	if (!location)
-		location = pstrdup(stmt->location);
+		location = pstrdup(stmt->location ? stmt->location : "");
 
 	if (stmt->filehandler)
 		fileHandler = pstrdup(stmt->filehandler);
@@ -1230,14 +1230,19 @@ destroy_tablespace_directories(Oid tablespaceoid, bool redo)
 	linkloc = pstrdup(linkloc_with_version_dir);
 	get_parent_directory(linkloc);
 
-	/* Remove the symlink target directory if it exists or is valid. */
+	/*
+	 * Remove the symlink target directory if it exists or is valid.
+	 * If linkloc is a directory (e.g. in-place tablespace), readlink()
+	 * will fail with EINVAL, which we can safely skip.
+	 */
 	rllen = readlink(linkloc, link_target_dir, sizeof(link_target_dir));
 	if(rllen < 0)
 	{
-		ereport(redo ? LOG : ERROR,
-				(errcode_for_file_access(),
-					errmsg("could not read symbolic link \"%s\": %m",
-						   linkloc)));
+		if (errno != EINVAL)
+			ereport(redo ? LOG : ERROR,
+					(errcode_for_file_access(),
+						errmsg("could not read symbolic link \"%s\": %m",
+							   linkloc)));
 	}
 	else if(rllen >= sizeof(link_target_dir))
 	{
diff --git a/src/backend/commands/vacuum_ao.c b/src/backend/commands/vacuum_ao.c
index 466fe30665d..dff6ecf332d 100644
--- a/src/backend/commands/vacuum_ao.c
+++ b/src/backend/commands/vacuum_ao.c
@@ -224,6 +224,14 @@ ao_vacuum_rel_pre_cleanup(Relation onerel, VacuumParams *params, BufferAccessStr
 	 */
 	ao_vacuum_rel_recycle_dead_segments(onerel, params, bstrategy, vacrelstats);
 
+	/*
+	 * Make the pg_aoseg updates above visible to AppendOptimizedTruncateToEOF's
+	 * catalog snapshot; without this the zeroed-eof rows are invisible (same
+	 * CommandId) and the old non-zero-eof rows appear live, triggering "file
+	 * size smaller than logical eof".
+	 */
+	CommandCounterIncrement();
+
 	/*
 	 * Also truncate all live segments to the EOF values stored in pg_aoseg.
 	 * This releases space left behind by aborted inserts.
diff --git a/src/backend/executor/nodeHash.c b/src/backend/executor/nodeHash.c
index a236f5b4819..e59a7c7ccc3 100644
--- a/src/backend/executor/nodeHash.c
+++ b/src/backend/executor/nodeHash.c
@@ -2011,6 +2011,7 @@ ExecParallelHashTableInsert(HashJoinTable hashtable,
 		/* Store the hash value in the HashJoinTuple header. */
 		hashTuple->hashvalue = hashvalue;
 		memcpy(HJTUPLE_MINTUPLE(hashTuple), tuple, tuple->t_len);
+		HeapTupleHeaderClearMatch(HJTUPLE_MINTUPLE(hashTuple));
 
 		/* Push it onto the front of the bucket's list */
 		ExecParallelHashPushTuple(&hashtable->buckets.shared[bucketno],
@@ -2395,6 +2396,69 @@ ExecPrepHashTableForUnmatched(HashJoinState *hjstate)
 	hjstate->hj_CurTuple = NULL;
 }
 
+/*
+ * Decide if this process is allowed to run the unmatched scan.  If so, the
+ * batch barrier is advanced to PHJ_BATCH_SCAN and true is returned.
+ * Otherwise the batch is detached and false is returned.
+ */
+bool
+ExecParallelPrepHashTableForUnmatched(HashJoinState *hjstate)
+{
+	HashJoinTable hashtable = hjstate->hj_HashTable;
+	int			curbatch = hashtable->curbatch;
+	ParallelHashJoinBatch *batch = hashtable->batches[curbatch].shared;
+
+	Assert(BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_PROBING);
+
+	/*
+	 * It would not be deadlock-free to wait on the batch barrier, because it
+	 * is in PHJ_BATCH_PROBING phase, and thus processes attached to it have
+	 * already emitted tuples.  Therefore, we'll hold a wait-free election:
+	 * only one process can continue to the next phase, and all others detach
+	 * from this batch.  They can still do any work on other batches, if there
+	 * are any.
+	 */
+	if (!BarrierArriveAndDetachExceptLast(&batch->batch_barrier))
+	{
+		/* This process considers the batch to be done. */
+		hashtable->batches[hashtable->curbatch].done = true;
+
+		/* Make sure any temporary files are closed. */
+		sts_end_parallel_scan(hashtable->batches[curbatch].inner_tuples);
+		sts_end_parallel_scan(hashtable->batches[curbatch].outer_tuples);
+
+		/*
+		 * Track largest batch we've seen, which would normally happen in
+		 * ExecHashTableDetachBatch().
+		 */
+		hashtable->spacePeak =
+			Max(hashtable->spacePeak,
+				batch->size + sizeof(dsa_pointer_atomic) * hashtable->nbuckets);
+		hashtable->curbatch = -1;
+		return false;
+	}
+
+	/* Now we are alone with this batch. */
+	Assert(BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_SCAN);
+	Assert(BarrierParticipants(&batch->batch_barrier) == 1);
+
+	/*
+	 * Has another process decided to give up early and command all processes
+	 * to skip the unmatched scan?
+	 */
+	if (batch->skip_unmatched)
+	{
+		hashtable->batches[hashtable->curbatch].done = true;
+		ExecHashTableDetachBatch(hashtable);
+		return false;
+	}
+
+	/* Now prepare the process local state, just as for non-parallel join. */
+	ExecPrepHashTableForUnmatched(hjstate);
+
+	return true;
+}
+
 /*
  * ExecScanHashTableForUnmatched
  *		scan the hash table for unmatched inner tuples
@@ -2469,6 +2533,72 @@ ExecScanHashTableForUnmatched(HashJoinState *hjstate, ExprContext *econtext)
 	return false;
 }
 
+/*
+ * ExecParallelScanHashTableForUnmatched
+ *		scan the hash table for unmatched inner tuples, in parallel join
+ *
+ * On success, the inner tuple is stored into hjstate->hj_CurTuple and
+ * econtext->ecxt_innertuple, using hjstate->hj_HashTupleSlot as the slot
+ * for the latter.
+ */
+bool
+ExecParallelScanHashTableForUnmatched(HashJoinState *hjstate,
+									  ExprContext *econtext)
+{
+	HashJoinTable hashtable = hjstate->hj_HashTable;
+	HashJoinTuple hashTuple = hjstate->hj_CurTuple;
+
+	for (;;)
+	{
+		/*
+		 * hj_CurTuple is the address of the tuple last returned from the
+		 * current bucket, or NULL if it's time to start scanning a new
+		 * bucket.
+		 */
+		if (hashTuple != NULL)
+			hashTuple = ExecParallelHashNextTuple(hashtable, hashTuple);
+		else if (hjstate->hj_CurBucketNo < hashtable->nbuckets)
+			hashTuple = ExecParallelHashFirstTuple(hashtable,
+												   hjstate->hj_CurBucketNo++);
+		else
+			break;				/* finished all buckets */
+
+		while (hashTuple != NULL)
+		{
+			if (!HeapTupleHeaderHasMatch(HJTUPLE_MINTUPLE(hashTuple)))
+			{
+				TupleTableSlot *inntuple;
+
+				/* insert hashtable's tuple into exec slot */
+				inntuple = ExecStoreMinimalTuple(HJTUPLE_MINTUPLE(hashTuple),
+												 hjstate->hj_HashTupleSlot,
+												 false);	/* do not pfree */
+				econtext->ecxt_innertuple = inntuple;
+
+				/*
+				 * Reset temp memory each time; although this function doesn't
+				 * do any qual eval, the caller will, so let's keep it
+				 * parallel to ExecScanHashBucket.
+				 */
+				ResetExprContext(econtext);
+
+				hjstate->hj_CurTuple = hashTuple;
+				return true;
+			}
+
+			hashTuple = ExecParallelHashNextTuple(hashtable, hashTuple);
+		}
+
+		/* allow this loop to be cancellable */
+		CHECK_FOR_INTERRUPTS();
+	}
+
+	/*
+	 * no more unmatched tuples
+	 */
+	return false;
+}
+
 /*
  * ExecHashTableReset
  *
@@ -3797,6 +3927,7 @@ ExecParallelHashEnsureBatchAccessors(HashJoinTable hashtable)
 		accessor->shared = shared;
 		accessor->preallocated = 0;
 		accessor->done = false;
+		accessor->outer_eof = false;
 		accessor->inner_tuples =
 			sts_attach(ParallelHashJoinBatchInner(shared),
 					   hashtable->hjstate->worker_id,
@@ -3842,25 +3973,63 @@ ExecHashTableDetachBatch(HashJoinTable hashtable)
 	{
 		int			curbatch = hashtable->curbatch;
 		ParallelHashJoinBatch *batch = hashtable->batches[curbatch].shared;
+		bool		attached = true;
 
 		/* Make sure any temporary files are closed. */
 		sts_end_parallel_scan(hashtable->batches[curbatch].inner_tuples);
 		sts_end_parallel_scan(hashtable->batches[curbatch].outer_tuples);
 
-		/* Detach from the batch we were last working on. */
+		/* After attaching we always get at least to PHJ_BATCH_PROBING. */
+		Assert(BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_PROBING ||
+			   BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_SCAN);
+
+		/*
+		 * If we're abandoning the PHJ_BATCH_PROBING phase early without having
+		 * reached the end of it, it means the plan doesn't want any more
+		 * tuples, and it is happy to abandon any tuples buffered in this
+		 * process's subplans.  For correctness, we can't allow any process to
+		 * execute the PHJ_BATCH_SCAN phase, because we will never have the
+		 * complete set of match bits.  Therefore we skip emitting unmatched
+		 * tuples in all backends (if this is a full/right join), as if those
+		 * tuples were all due to be emitted by this process and it has
+		 * abandoned them too.
+		 */
 		/*
 		 * CBDB_PARALLEL: Parallel Hash Left Anti Semi (Not-In) Join(parallel-aware)
 		 * If phs_lasj_has_null is true, that means we have found null when building hash table,
 		 * there were no batches to detach.
 		 */
-		if (!hashtable->parallel_state->phs_lasj_has_null && BarrierArriveAndDetach(&batch->batch_barrier))
+		if (BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_PROBING &&
+			!hashtable->parallel_state->phs_lasj_has_null && /* CBDB_PARALLEL */
+			!hashtable->batches[curbatch].outer_eof)
+		{
+			/*
+			 * This flag may be written to by multiple backends during
+			 * PHJ_BATCH_PROBING phase, but will only be read in PHJ_BATCH_SCAN
+			 * phase so requires no extra locking.
+			 */
+			batch->skip_unmatched = true;
+		}
+
+		/*
+		 * Even if we aren't doing a full/right outer join, we'll step through
+		 * the PHJ_BATCH_SCAN phase just to maintain the invariant that
+		 * freeing happens in PHJ_BATCH_FREE, but that'll be wait-free.
+		 */
+		if (BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_PROBING &&
+			!hashtable->parallel_state->phs_lasj_has_null /* CBDB_PARALLEL */)
+			attached = BarrierArriveAndDetachExceptLast(&batch->batch_barrier);
+		if (attached && !hashtable->parallel_state->phs_lasj_has_null /* CBDB_PARALLEL */ &&
+			BarrierArriveAndDetach(&batch->batch_barrier))
 		{
 			/*
-			 * Technically we shouldn't access the barrier because we're no
-			 * longer attached, but since there is no way it's moving after
-			 * this point it seems safe to make the following assertion.
+			 * We are no longer attached to the batch barrier, but we're the
+			 * process that was chosen to free resources and it's safe to
+			 * assert the current phase.  The ParallelHashJoinBatch can't go
+			 * away underneath us while we are attached to the build barrier,
+			 * making this access safe.
 			 */
-			Assert(BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_DONE);
+			Assert(BarrierPhase(&batch->batch_barrier) == PHJ_BATCH_FREE);
 
 			/* Free shared chunks and buckets. */
 			while (DsaPointerIsValid(batch->chunks))
diff --git a/src/backend/executor/nodeHashjoin.c b/src/backend/executor/nodeHashjoin.c
index 88eaaa10cef..9981ed8f7ae 100644
--- a/src/backend/executor/nodeHashjoin.c
+++ b/src/backend/executor/nodeHashjoin.c
@@ -81,11 +81,12 @@
  * aren't enough to go around.  For each batch there is a separate barrier
  * with the following phases:
  *
- *  PHJ_BATCH_ELECTING       -- initial state
- *  PHJ_BATCH_ALLOCATING     -- one allocates buckets
- *  PHJ_BATCH_LOADING        -- all load the hash table from disk
- *  PHJ_BATCH_PROBING        -- all probe
- *  PHJ_BATCH_DONE           -- end
+ *  PHJ_BATCH_ELECT          -- initial state
+ *  PHJ_BATCH_ALLOCATE*      -- one allocates buckets
+ *  PHJ_BATCH_LOAD           -- all load the hash table from disk
+ *  PHJ_BATCH_PROBING        -- all probe
+ *  PHJ_BATCH_SCAN*          -- one does full/right unmatched scan
+ *  PHJ_BATCH_FREE*          -- one frees memory
  *
  * Batch 0 is a special case, because it starts out in phase
  * PHJ_BATCH_PROBING; populating batch 0's hash table is done during
@@ -101,10 +102,11 @@
  * finished.  Practically, that means that we never emit a tuple while attached
  * to a barrier, unless the barrier has reached a phase that means that no
  * process will wait on it again.  We emit tuples while attached to the build
- * barrier in phase PHJ_BUILD_RUNNING, and to a per-batch barrier in phase
- * PHJ_BATCH_PROBING.  These are advanced to PHJ_BUILD_DONE and PHJ_BATCH_DONE
- * respectively without waiting, using BarrierArriveAndDetach().  The last to
- * detach receives a different return value so that it knows that it's safe to
+ * barrier in phase PHJ_BUILD_RUN, and to a per-batch barrier in phase
+ * PHJ_BATCH_PROBING.  These are advanced to PHJ_BUILD_FREE and PHJ_BATCH_SCAN
+ * without waiting, using BarrierArriveAndDetach() and
+ * BarrierArriveAndDetachExceptLast() respectively.  The last to detach
+ * receives a different return value so that it knows that it's safe to
  * clean up.  Any straggler process that attaches after that phase is reached
  * will see that it's too late to participate or access the relevant shared
  * memory objects.
@@ -523,8 +525,23 @@ ExecHashJoinImpl(PlanState *pstate, bool parallel)
 					if (HJ_FILL_INNER(node))
 					{
 						/* set up to scan for unmatched inner tuples */
-						ExecPrepHashTableForUnmatched(node);
-						node->hj_JoinState = HJ_FILL_INNER_TUPLES;
+						if (parallel)
+						{
+							/*
+							 * Only one process is currently allowed to handle
+							 * each batch's unmatched tuples, in a parallel
+							 * join.
+							 */
+							if (ExecParallelPrepHashTableForUnmatched(node))
+								node->hj_JoinState = HJ_FILL_INNER_TUPLES;
+							else
+								node->hj_JoinState = HJ_NEED_NEW_BATCH;
+						}
+						else
+						{
+							ExecPrepHashTableForUnmatched(node);
+							node->hj_JoinState = HJ_FILL_INNER_TUPLES;
+						}
 					}
 					else
 						node->hj_JoinState = HJ_NEED_NEW_BATCH;
@@ -635,25 +652,13 @@ ExecHashJoinImpl(PlanState *pstate, bool parallel)
 				{
 					node->hj_MatchedOuter = true;
 
-					if (parallel)
-					{
-						/*
-						 * Full/right outer joins are currently not supported
-						 * for parallel joins, so we don't need to set the
-						 * match bit.  Experiments show that it's worth
-						 * avoiding the shared memory traffic on large
-						 * systems.
-						 */
-						Assert(!HJ_FILL_INNER(node));
-					}
-					else
-					{
-						/*
-						 * This is really only needed if HJ_FILL_INNER(node),
-						 * but we'll avoid the branch and just set it always.
-						 */
+
+					/*
+					 * This is really only needed if HJ_FILL_INNER(node), but
+					 * we'll avoid the branch and just set it always.
+					 */
+					if (!HeapTupleHeaderHasMatch(HJTUPLE_MINTUPLE(node->hj_CurTuple)))
 						HeapTupleHeaderSetMatch(HJTUPLE_MINTUPLE(node->hj_CurTuple));
-					}
 
 					/* In an antijoin, we never return a matched tuple */
 					if (node->js.jointype == JOIN_ANTI ||
@@ -712,7 +717,8 @@ ExecHashJoinImpl(PlanState *pstate, bool parallel)
 				 * so any unmatched inner tuples in the hashtable have to be
 				 * emitted before we continue to the next batch.
 				 */
-				if (!ExecScanHashTableForUnmatched(node, econtext))
+				if (!(parallel ? ExecParallelScanHashTableForUnmatched(node, econtext)
+					  : ExecScanHashTableForUnmatched(node, econtext)))
 				{
 					/* no more unmatched tuples */
 					node->hj_JoinState = HJ_NEED_NEW_BATCH;
@@ -1271,6 +1277,8 @@ ExecParallelHashJoinOuterGetTuple(PlanState *outerNode,
 	}
 
 	/* End of this batch */
+	hashtable->batches[curbatch].outer_eof = true;
+
 	return NULL;
 }
 
@@ -1543,15 +1551,34 @@ ExecParallelHashJoinNewBatch(HashJoinState *hjstate)
 					 * hash table stays alive until everyone's finished
 					 * probing it, but no participant is allowed to wait at
 					 * this barrier again (or else a deadlock could occur).
-					 * All attached participants must eventually call
-					 * BarrierArriveAndDetach() so that the final phase
-					 * PHJ_BATCH_DONE can be reached.
+					 * All attached participants must eventually detach from
+					 * the barrier and one worker must advance the phase so
+					 * that the final phase is reached.
 					 */
 					ExecParallelHashTableSetCurrentBatch(hashtable, batchno);
 					sts_begin_parallel_scan(hashtable->batches[batchno].outer_tuples);
+
 					return true;
+				case PHJ_BATCH_SCAN:
+
+					/*
+					 * In principle, we could help scan for unmatched tuples,
+					 * since that phase is already underway (the thing we
+					 * can't do under current deadlock-avoidance rules is wait
+					 * for others to arrive at PHJ_BATCH_SCAN, because
+					 * PHJ_BATCH_PROBING emits tuples, but in this case we just
+					 * got here without waiting).  That is not yet done.  For
+					 * now, we just detach and go around again.  We have to
+					 * use ExecHashTableDetachBatch() because there's a small
+					 * chance we'll be the last to detach, and then we're
+					 * responsible for freeing memory.
+					 */
+					ExecParallelHashTableSetCurrentBatch(hashtable, batchno);
+					hashtable->batches[batchno].done = true;
+					ExecHashTableDetachBatch(hashtable);
+					break;
 
-				case PHJ_BATCH_DONE:
+				case PHJ_BATCH_FREE:
 
 					/*
 					 * Already done.  Detach and go around again (if any
diff --git a/src/backend/foreign/foreign.c b/src/backend/foreign/foreign.c
index 2d60eff9459..7a00c5f06db 100644
--- a/src/backend/foreign/foreign.c
+++ b/src/backend/foreign/foreign.c
@@ -33,6 +33,7 @@
 #include "optimizer/planmain.h"
 #include "optimizer/restrictinfo.h"
 #include "optimizer/tlist.h"
+#include "tcop/tcopprot.h"
 #include "utils/builtins.h"
 #include "utils/memutils.h"
 #include "utils/rel.h"
@@ -590,6 +591,15 @@ GetFdwRoutine(Oid fdwhandler)
 	Datum		datum;
 	FdwRoutine *routine;
 
+	/* Check if the access to foreign tables is restricted */
+	if (unlikely((restrict_nonsystem_relation_kind & RESTRICT_RELKIND_FOREIGN_TABLE) != 0))
+	{
+		/* there must not be a built-in FDW handler */
+		ereport(ERROR,
+				(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+				 errmsg("access to non-system foreign table is restricted")));
+	}
+
 	datum = OidFunctionCall0(fdwhandler);
 	routine = (FdwRoutine *) DatumGetPointer(datum);
 
diff --git a/src/backend/gpopt/config/CConfigParamMapping.cpp b/src/backend/gpopt/config/CConfigParamMapping.cpp
index 603855c50ec..5bd9091f604 100644
--- a/src/backend/gpopt/config/CConfigParamMapping.cpp
+++ b/src/backend/gpopt/config/CConfigParamMapping.cpp
@@ -331,7 +331,12 @@ CConfigParamMapping::SConfigMappingElem CConfigParamMapping::m_elements[] = {
 	 false,	 // m_negate_param
 	 GPOS_WSZ_LIT(
 		 "Enable create window hash agg")},
-	
+
+	{EopttraceDisableStreamingHashAgg, &optimizer_use_streaming_hashagg,
+	 true,	// m_negate_param
+	 GPOS_WSZ_LIT(
+		 "Disable streaming hash agg in ORCA-generated local partial aggregations.")},
+
 };
 
 //---------------------------------------------------------------------------
@@ -449,6 +454,8 @@ CConfigParamMapping::PackConfigParamInBitset(
 		// disable table scan if the corresponding GUC is turned off
 		traceflag_bitset->ExchangeSet(
 			GPOPT_DISABLE_XFORM_TF(CXform::ExfGet2TableScan));
+		traceflag_bitset->ExchangeSet(
+			GPOPT_DISABLE_XFORM_TF(CXform::ExfGet2ParallelTableScan));
 	}
 
 	if (!optimizer_enable_push_join_below_union_all)
diff --git a/src/backend/gpopt/gpdbwrappers.cpp b/src/backend/gpopt/gpdbwrappers.cpp
index aca95b2cc0a..97b149d6164 100644
--- a/src/backend/gpopt/gpdbwrappers.cpp
+++ b/src/backend/gpopt/gpdbwrappers.cpp
@@ -25,6 +25,8 @@
 #include <limits>  // std::numeric_limits
 
 #include "gpos/base.h"
+#include "gpopt/base/COptCtxt.h"
+#include "gpopt/optimizer/COptimizerConfig.h"
 #include "gpos/error/CAutoExceptionStack.h"
 #include "gpos/error/CException.h"
 
@@ -36,8 +38,10 @@ extern "C" {
 #include "access/amapi.h"
 #include "access/external.h"
 #include "access/genam.h"
+#include "access/parallel.h"
 #include "catalog/pg_aggregate.h"
 #include "catalog/pg_inherits.h"
+#include "cdb/cdbvars.h"
 #include "foreign/fdwapi.h"
 #include "nodes/nodeFuncs.h"
 #include "optimizer/clauses.h"
@@ -52,6 +56,9 @@ extern "C" {
 #include "utils/lsyscache.h"
 #include "utils/memutils.h"
 #include "utils/partcache.h"
+
+extern bool enable_parallel;
+extern int max_parallel_workers_per_gather;
 }
 #define GP_WRAP_START                                            \
 	sigjmp_buf local_sigjmp_buf;                                 \
@@ -2012,6 +2019,17 @@ gpdb::CheckCollation(Node *node)
 	return -1;
 }
 
+bool
+gpdb::HasOrderByOrderingOp(Query *query)
+{
+	GP_WRAP_START;
+	{
+		return has_orderby_ordering_op(query);
+	}
+	GP_WRAP_END;
+	return false;
+}
+
 Node *
 gpdb::CoerceToCommonType(ParseState *pstate, Node *node, Oid target_type,
 						 const char *context)
@@ -2565,6 +2583,19 @@ gpdb::GetForeignServerId(Oid reloid)
 	return 0;
 }
 
+int16
+gpdb::GetAppendOnlySegmentFilesCount(Relation rel)
+{
+	GP_WRAP_START;
+	{
+		FormData_pg_appendonly aoFormData;
+		GetAppendOnlyEntry(rel, &aoFormData);
+		return aoFormData.segfilecount;
+	}
+	GP_WRAP_END;
+	return -1;
+}
+
 // Locks on partition leafs and indexes are held during optimizer (after
 // parse-analyze stage). ORCA need this function to lock relation. Here
 // we do not need to consider lock-upgrade issue, reasons are:
@@ -2723,4 +2754,36 @@ gpdb::TestexprIsHashable(Node *testexpr, List *param_ids)
 	return false;
 }
 
+// check if parallel mode is OK (comprehensive check)
+bool
+gpdb::IsParallelModeOK(void)
+{
+	GP_WRAP_START;
+	{
+		if (!enable_parallel)
+			return false;
+
+		if (IS_SINGLENODE())
+			return false;
+
+		if (max_parallel_workers_per_gather <= 0)
+			return false;
+
+		// Check if parallel plans are enabled in current optimizer context
+		gpopt::COptCtxt *poctxt = gpopt::COptCtxt::PoctxtFromTLS();
+		if (nullptr != poctxt)
+		{
+			gpopt::COptimizerConfig *optimizer_config = poctxt->GetOptimizerConfig();
+			if (nullptr != optimizer_config)
+			{
+				if (!optimizer_config->CreateParallelPlan())
+					return false;
+			}
+		}
+		return true;
+	}
+	GP_WRAP_END;
+	return false;  // fallback after GP_WRAP_END (a null context returns true above)
+}
+
 // EOF
diff --git a/src/backend/gpopt/translate/CTranslatorDXLToPlStmt.cpp b/src/backend/gpopt/translate/CTranslatorDXLToPlStmt.cpp
index 4acf13bd606..6084abe1c62 100644
--- a/src/backend/gpopt/translate/CTranslatorDXLToPlStmt.cpp
+++ b/src/backend/gpopt/translate/CTranslatorDXLToPlStmt.cpp
@@ -30,6 +30,7 @@ extern "C" {
 #include "partitioning/partdesc.h"
 #include "storage/lmgr.h"
 #include "utils/guc.h"
+#include "optimizer/cost.h"
 #include "utils/lsyscache.h"
 #include "utils/partcache.h"
 #include "utils/rel.h"
@@ -83,6 +84,7 @@ extern "C" {
 #include "naucrates/dxl/operators/CDXLPhysicalSplit.h"
 #include "naucrates/dxl/operators/CDXLPhysicalTVF.h"
 #include "naucrates/dxl/operators/CDXLPhysicalTableScan.h"
+#include "naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h"
 #include "naucrates/dxl/operators/CDXLPhysicalValuesScan.h"
 #include "naucrates/dxl/operators/CDXLPhysicalWindow.h"
 #include "naucrates/dxl/operators/CDXLScalarBitmapBoolOp.h"
@@ -348,6 +350,12 @@ CTranslatorDXLToPlStmt::TranslateDXLOperatorToPlan(
 									   ctxt_translation_prev_siblings);
 			break;
 		}
+		case EdxlopPhysicalParallelTableScan:
+		{
+			plan = TranslateDXLParallelTblScan(dxlnode, output_context,
+											   ctxt_translation_prev_siblings);
+			break;
+		}
 		case EdxlopPhysicalIndexScan:
 		{
 			plan = TranslateDXLIndexScan(dxlnode, output_context,
@@ -712,6 +720,111 @@ CTranslatorDXLToPlStmt::TranslateDXLTblScan(
 }
 
 
+//---------------------------------------------------------------------------
+//	@function:
+//		CTranslatorDXLToPlStmt::TranslateDXLParallelTblScan
+//
+//	@doc:
+//		Translates a DXL parallel table scan node into a parallel SeqScan node
+Plan *
+CTranslatorDXLToPlStmt::TranslateDXLParallelTblScan(
+	const CDXLNode *tbl_scan_dxlnode, CDXLTranslateContext *output_context,
+	CDXLTranslationContextArray * /*ctxt_translation_prev_siblings*/)
+{
+	// fetch the parallel scan operator; it carries the table descriptor and worker count
+	CDXLPhysicalParallelTableScan *phy_parallel_tbl_scan_dxlop =
+		CDXLPhysicalParallelTableScan::Cast(tbl_scan_dxlnode->GetOperator());
+
+	ULONG parallel_workers = phy_parallel_tbl_scan_dxlop->UlParallelWorkers();
+
+	// translation context for column mappings in the base relation
+	CDXLTranslateContextBaseTable base_table_context(m_mp);
+
+	const CDXLTableDescr *dxl_table_descr =
+		phy_parallel_tbl_scan_dxlop->GetDXLTableDescr();
+	const IMDRelation *md_rel =
+		m_md_accessor->RetrieveRel(dxl_table_descr->MDId());
+
+	// Lock any table we are to scan, since it may not have been properly locked
+	// by the parser (e.g. in case of generated scans for partitioned tables)
+	OID oidRel = CMDIdGPDB::CastMdid(md_rel->MDId())->Oid();
+	GPOS_ASSERT(dxl_table_descr->LockMode() != -1);
+	gpdb::GPDBLockRelationOid(oidRel, dxl_table_descr->LockMode());
+
+	Index index = ProcessDXLTblDescr(dxl_table_descr, &base_table_context);
+
+	// a table scan node must have 2 children: projection list and filter
+	GPOS_ASSERT(2 == tbl_scan_dxlnode->Arity());
+
+	// translate proj list and filter
+	CDXLNode *project_list_dxlnode = (*tbl_scan_dxlnode)[EdxltsIndexProjList];
+	CDXLNode *filter_dxlnode = (*tbl_scan_dxlnode)[EdxltsIndexFilter];
+
+	List *targetlist = NIL;
+
+	// List to hold the quals after translating filter_dxlnode node.
+	List *query_quals = NIL;
+
+	TranslateProjListAndFilter(
+		project_list_dxlnode, filter_dxlnode,
+		&base_table_context,  // translate context for the base table
+		nullptr,			  // translate_ctxt_left and pdxltrctxRight,
+		&targetlist, &query_quals, output_context);
+
+	Plan *plan = nullptr;
+	Plan *plan_return = nullptr;
+
+	// Parallel table scans are always sequential scans (not foreign scans)
+	SeqScan *seq_scan = MakeNode(SeqScan);
+	seq_scan->scanrelid = index;
+	plan = &(seq_scan->plan);
+	plan_return = (Plan *) seq_scan;
+
+	// Mark the scan parallel-aware/safe and record the worker count on the plan node
+	plan->parallel_aware = true;
+	plan->parallel_safe = true;
+	plan->parallel = (int) parallel_workers;
+
+	plan->targetlist = targetlist;
+
+	// List to hold the quals which contain both security quals and query
+	// quals.
+	List *security_query_quals = NIL;
+
+	// Fetching the RTE of the relation from the rewritten parse tree
+	// based on the oidRel and adding the security quals of the RTE in
+	// the security_query_quals list.
+	AddSecurityQuals(oidRel, &security_query_quals, &index);
+
+	// The security quals should always be executed first when
+	// compared to other quals. So appending query quals to the
+	// security_query_quals list after the security quals.
+	security_query_quals =
+		gpdb::ListConcat(security_query_quals, query_quals);
+	plan->qual = security_query_quals;
+
+	if (md_rel->IsNonBlockTable())
+	{
+		CheckSafeTargetListForAOTables(plan->targetlist);
+	}
+
+	plan->plan_node_id = m_dxl_to_plstmt_context->GetNextPlanId();
+
+	// translate operator costs
+	TranslatePlanCosts(tbl_scan_dxlnode, plan);
+
+	// Report per-worker rows: divide the estimate by the worker count, rounding up
+	if (parallel_workers > 1)
+	{
+		plan->plan_rows = ceil(plan->plan_rows / parallel_workers);
+	}
+
+	SetParamIds(plan);
+
+	return plan_return;
+}
+
+
 //---------------------------------------------------------------------------
 //	@function:
 //		CTranslatorDXLToPlStmt::SetIndexVarAttnoWalker
@@ -719,7 +832,6 @@ CTranslatorDXLToPlStmt::TranslateDXLTblScan(
 //	@doc:
 //		Walker to set index var attno's,
 //		attnos of index vars are set to their relative positions in index keys,
-//		skip any outer references while walking the expression tree
 //
 //---------------------------------------------------------------------------
 BOOL
@@ -2415,15 +2527,34 @@ CTranslatorDXLToPlStmt::TranslateDXLMotion(
 	sendslice->directDispatch.contentIds = NIL;
 	sendslice->directDispatch.haveProcessedAnyCalculations = false;
 
+	// set parallel workers if needed
+	ULONG child_index = motion_dxlop->GetRelationChildIdx();
+	CDXLNode *child_dxlnode = (*motion_dxlnode)[child_index];
+	ULONG child_parallel_workers = ExtractParallelWorkersFromDXL(child_dxlnode);
+	if (child_parallel_workers > 1)
+	{
+		// Only primary reader/writer gangs may run parallel workers in the sending slice
+		bool supports_parallel = (sendslice->gangType == GANGTYPE_PRIMARY_READER ||
+		                          sendslice->gangType == GANGTYPE_PRIMARY_WRITER);
+
+		if (supports_parallel)
+		{
+			sendslice->parallel_workers = child_parallel_workers;
+		}
+		else
+		{
+			// Disable parallel for: non-PRIMARY gang types
+			// (SINGLETON_READER, ENTRYDB_READER, UNALLOCATED)
+			sendslice->parallel_workers = 0;
+		}
+	}
+
 	motion->motionID = sendslice->sliceIndex;
 
 	// translate motion child
 	// child node is in the same position in broadcast and gather motion nodes
 	// but different in redistribute motion nodes
-
-	ULONG child_index = motion_dxlop->GetRelationChildIdx();
-
-	CDXLNode *child_dxlnode = (*motion_dxlnode)[child_index];
+	// Note: child_index and child_dxlnode already defined above
 
 	CDXLTranslateContext child_context(m_mp, false,
 									   output_context->GetColIdToParamIdMap());
@@ -2576,6 +2707,16 @@ CTranslatorDXLToPlStmt::TranslateDXLMotion(
 			return nullptr;
 	}
 
+	// Adjust row count for parallel execution in the sending slice
+	// The Motion node receives rows from all parallel workers, so we need to
+	// account for the fact that each worker processes a fraction of the rows.
+	// TranslatePlanCosts() already divided by numsegments, but if we have
+	// parallel workers, each segment is further subdivided among workers.
+	if (sendslice->parallel_workers > 1)
+	{
+		plan->plan_rows = ceil(plan->plan_rows / sendslice->parallel_workers);
+	}
+
 	SetParamIds(plan);
 
 	return (Plan *) motion;
@@ -3306,7 +3447,7 @@ CTranslatorDXLToPlStmt::TranslateDXLWindowAgg(
 		// translate the window frame specified in the window key
 		if (nullptr != window_key->GetWindowFrame())
 		{
-			window->frameOptions = FRAMEOPTION_NONDEFAULT;
+			window->frameOptions = FRAMEOPTION_NONDEFAULT | FRAMEOPTION_BETWEEN;
 			window->frameOptions |= WindowFrameSpecToOptions(window_frame->ParseDXLFrameSpec());
 			window->frameOptions |= WindowFrameExclusionStrategyToOptions(
 				window_frame->ParseFrameExclusionStrategy());
@@ -3510,7 +3651,7 @@ CTranslatorDXLToPlStmt::TranslateDXLWindowHashAgg(
 		// translate the window frame specified in the window key
 		if (nullptr != window_key->GetWindowFrame())
 		{
-			window->frameOptions = FRAMEOPTION_NONDEFAULT;
+			window->frameOptions = FRAMEOPTION_NONDEFAULT | FRAMEOPTION_BETWEEN;
 			window->frameOptions |= WindowFrameSpecToOptions(window_frame->ParseDXLFrameSpec());
 			window->frameOptions |= WindowFrameExclusionStrategyToOptions(
 				window_frame->ParseFrameExclusionStrategy());
@@ -7282,4 +7423,75 @@ CTranslatorDXLToPlStmt::IsIndexForOrderBy(
 	}
 	return false;
 }
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CTranslatorDXLToPlStmt::ExtractParallelWorkersFromDXL
+//
+//	@doc:
+//		Extract parallel workers count from DXL node tree recursively.
+//		Since parallel degree is uniform across all parallel scans in a query,
+//		returns the first parallel degree found from any CDXLPhysicalParallelTableScan,
+//		or 1 if no parallel scan exists.
+//
+//---------------------------------------------------------------------------
+ULONG
+CTranslatorDXLToPlStmt::ExtractParallelWorkersFromDXL(const CDXLNode *dxlnode)
+{
+	if (nullptr == dxlnode)
+	{
+		return 1;
+	}
+
+	CDXLOperator *dxlop = dxlnode->GetOperator();
+	if (EdxlopPhysicalParallelTableScan == dxlop->GetDXLOperator())
+	{
+		// Return parallel workers from the parallel table scan operator
+		// All parallel scans in the query share the same parallel degree
+		CDXLPhysicalParallelTableScan *parallel_scan_dxlop =
+			CDXLPhysicalParallelTableScan::Cast(dxlop);
+		return parallel_scan_dxlop->UlParallelWorkers();
+	}
+	else if (EdxlopPhysicalTableScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalDynamicTableScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalIndexScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalIndexOnlyScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalBitmapTableScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalDynamicBitmapTableScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalForeignScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalDynamicForeignScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalDynamicIndexScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalDynamicIndexOnlyScan == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalValuesScan == dxlop->GetDXLOperator())
+	{
+		// Non-parallel scans (table, index, bitmap, foreign, values)
+		// These are leaf nodes in terms of parallel worker extraction
+		// Return 1 to indicate no parallel workers
+		return 1;
+	}
+	else if (EdxlopPhysicalMotionGather == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalMotionBroadcast == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalMotionRedistribute == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalMotionRandom == dxlop->GetDXLOperator() ||
+			 EdxlopPhysicalMotionRoutedDistribute == dxlop->GetDXLOperator())
+	{
+		// Motion node creates a slice boundary - do not recurse into child
+		// Parallel workers below this motion belong to its own sending slice
+		// Return 1 to indicate this subtree adds no parallel workers to the current slice
+		return 1;
+	}
+
+	// Recursively check child nodes, return early when first parallel scan is found
+	for (ULONG ul = 0; ul < dxlnode->Arity(); ul++)
+	{
+		ULONG child_parallel_workers = ExtractParallelWorkersFromDXL((*dxlnode)[ul]);
+		if (child_parallel_workers > 1)
+		{
+			return child_parallel_workers;
+		}
+	}
+
+	return 1;
+}
+
 // EOF
diff --git a/src/backend/gpopt/translate/CTranslatorQueryToDXL.cpp b/src/backend/gpopt/translate/CTranslatorQueryToDXL.cpp
index 20cc6557c28..99d87917b38 100644
--- a/src/backend/gpopt/translate/CTranslatorQueryToDXL.cpp
+++ b/src/backend/gpopt/translate/CTranslatorQueryToDXL.cpp
@@ -324,6 +324,15 @@ CTranslatorQueryToDXL::CheckUnsupportedNodeTypes(Query *query)
 		GPOS_RAISE(gpdxl::ExmaDXL, gpdxl::ExmiQuery2DXLUnsupportedFeature,
 				   GPOS_WSZ_LIT("Non-default collation"));
 	}
+
+	// ORCA does not support amcanorderbyop (KNN ordered index scans).
+	// Fall back to the PostgreSQL planner for queries whose ORDER BY
+	// contains an ordering operator (e.g., <-> for distance).
+	if (gpdb::HasOrderByOrderingOp(query))
+	{
+		GPOS_RAISE(gpdxl::ExmaDXL, gpdxl::ExmiQuery2DXLUnsupportedFeature,
+				   GPOS_WSZ_LIT("ORDER BY with ordering operator (amcanorderbyop)"));
+	}
 }
 
 //---------------------------------------------------------------------------
diff --git a/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp b/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp
index ee4b8888b19..aa23d3932a2 100644
--- a/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp
+++ b/src/backend/gpopt/translate/CTranslatorRelcacheToDXL.cpp
@@ -516,7 +516,6 @@ CTranslatorRelcacheToDXL::RetrieveRel(CMemoryPool *mp, CMDAccessor *md_accessor,
 	IMdIdArray *check_constraint_mdids = nullptr;
 	BOOL is_temporary = false;
 	BOOL is_partitioned = false;
-	IMDRelation *md_rel = nullptr;
 	IMdIdArray *partition_oids = nullptr;
 	IMDId *foreign_server_mdid = nullptr;
 
@@ -618,14 +617,31 @@ CTranslatorRelcacheToDXL::RetrieveRel(CMemoryPool *mp, CMDAccessor *md_accessor,
 			CMDIdGPDB(IMDId::EmdidGeneral, gpdb::GetForeignServerId(oid));
 	}
 
-	md_rel = GPOS_NEW(mp) CMDRelationGPDB(
+	CMDRelationGPDB *md_rel_gpdb = GPOS_NEW(mp) CMDRelationGPDB(
 		mp, mdid, mdname, is_temporary, rel_storage_type, dist,
 		mdcol_array, distr_cols, distr_op_families, part_keys, part_types,
 		partition_oids, convert_hash_to_random, keyset_array,
 		md_index_info_array, check_constraint_mdids, mdpart_constraint,
 		foreign_server_mdid, rel->rd_rel->reltuples);
 
-	return md_rel;
+	// Set segment file count for AO/AOCO tables
+	// Skip partitioned tables as they don't have physical storage (only leaf partitions do)
+	if ((rel_storage_type == IMDRelation::ErelstorageAppendOnlyRows ||
+		 rel_storage_type == IMDRelation::ErelstorageAppendOnlyCols) &&
+		rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE)
+	{
+		INT seg_file_count = gpdb::GetAppendOnlySegmentFilesCount(rel.get());
+		md_rel_gpdb->SetSegFileCount(seg_file_count);
+	}
+
+	// Set parallel workers from table options
+	if (rel->rd_options != NULL)
+	{
+		INT parallel_workers = RelationGetParallelWorkers(rel.get(), -1);
+		md_rel_gpdb->SetParallelWorkers(parallel_workers);
+	}
+
+	return md_rel_gpdb;
 }
 
 //---------------------------------------------------------------------------
diff --git a/src/backend/gpopt/utils/COptTasks.cpp b/src/backend/gpopt/utils/COptTasks.cpp
index 6bd93379f0f..30e6e131f3d 100644
--- a/src/backend/gpopt/utils/COptTasks.cpp
+++ b/src/backend/gpopt/utils/COptTasks.cpp
@@ -385,7 +385,7 @@ COptTasks::LoadSearchStrategy(CMemoryPool *mp, char *path)
 //---------------------------------------------------------------------------
 COptimizerConfig *
 COptTasks::CreateOptimizerConfig(CMemoryPool *mp, ICostModel *cost_model,
-								 CPlanHint *plan_hints)
+								 CPlanHint *plan_hints, BOOL enable_parallel_plans)
 {
 	// get chosen plan number, cost threshold
 	ULLONG plan_id = (ULLONG) optimizer_plan_id;
@@ -424,7 +424,8 @@ COptTasks::CreateOptimizerConfig(CMemoryPool *mp, ICostModel *cost_model,
 				  push_group_by_below_setop_threshold, xform_bind_threshold,
 				  skew_factor),
 		plan_hints,
-		GPOS_NEW(mp) CWindowOids(mp, OID(F_ROW_NUMBER), OID(F_RANK_), OID(F_DENSE_RANK_)));
+		GPOS_NEW(mp) CWindowOids(mp, OID(F_ROW_NUMBER), OID(F_RANK_), OID(F_DENSE_RANK_)),
+		enable_parallel_plans);
 }
 
 //---------------------------------------------------------------------------
@@ -961,7 +962,7 @@ COptTasks::OptimizeTask(void *ptr)
 			ICostModel *cost_model = GetCostModel(mp, num_segments_for_costing);
 			CPlanHint *plan_hints = GetPlanHints(mp, opt_ctxt->m_query);
 			COptimizerConfig *optimizer_config =
-				CreateOptimizerConfig(mp, cost_model, plan_hints);
+				CreateOptimizerConfig(mp, cost_model, plan_hints, opt_ctxt->m_create_parallel_plan);
 			CConstExprEvaluatorProxy expr_eval_proxy(mp, &mda);
 			IConstExprEvaluator *expr_evaluator =
 				GPOS_NEW(mp) CConstExprEvaluatorDXL(mp, &mda, &expr_eval_proxy);
@@ -1186,6 +1187,7 @@ COptTasks::GPOPTOptimizedPlan(Query *query, SOptContext *gpopt_context, Optimize
 	gpopt_context->m_should_generate_plan_stmt = true;
 	// Copy options in `OptimizerOptions` to `SOptContext`
 	gpopt_context->m_create_vec_plan = opts->create_vectorization_plan;
+	gpopt_context->m_create_parallel_plan = opts->create_parallel_plan;
 	Execute(&OptimizeTask, gpopt_context);
 	return gpopt_context->m_plan_stmt;
 }
diff --git a/src/backend/gporca/concourse/build_and_test.py b/src/backend/gporca/concourse/build_and_test.py
deleted file mode 100755
index e885843dc4c..00000000000
--- a/src/backend/gporca/concourse/build_and_test.py
+++ /dev/null
@@ -1,110 +0,0 @@
-#!/usr/bin/python3
-
-import optparse
-import os
-import shutil
-import subprocess
-import sys
-
-def num_cpus():
-    # Use multiprocessing module, available in Python 2.6+
-    try:
-        import multiprocessing
-        return multiprocessing.cpu_count()
-    except (ImportError, NotImplementedError):
-        pass
-
-    # Get POSIX system config value for number of processors.
-    posix_num_cpus = os.sysconf("SC_NPROCESSORS_ONLN")
-    if posix_num_cpus != -1:
-        return posix_num_cpus
-
-    # Guess
-    return 2
-
-def install_dependencies(dependencies, output_dir):
-    for dependency in dependencies:
-        status = install_dependency(dependency, output_dir)
-        if status:
-            return status
-
-def install_dependency(dependency_name, output_dir):
-    return subprocess.call(
-        ["tar -xzf " + dependency_name + "/*.tar.gz -C " + output_dir], shell=True)
-
-def cmake_configure(src_dir, build_type, output_dir, cxx_compiler = None, cxxflags = None):
-    if os.path.exists("build"):
-        shutil.rmtree("build")
-    os.mkdir("build")
-    cmake_args = ["cmake",
-                  "-D", "CMAKE_INSTALL_PREFIX=" + output_dir,
-                  "-D", "CMAKE_BUILD_TYPE=" + build_type]
-    if cxx_compiler:
-        cmake_args.append("-D")
-        cmake_args.append("CMAKE_CXX_COMPILER=" + cxx_compiler)
-    if cxxflags:
-        cmake_args.append("-D")
-        cmake_args.append("CMAKE_CXX_FLAGS=" + cxxflags)
-
-    cmake_args.append("../" + src_dir)
-    cmake_command = " ".join(cmake_args)
-    if os.path.exists('/opt/gcc_env.sh'):
-        cmake_command = "source /opt/gcc_env.sh && " + cmake_command
-    print(cmake_command)
-    return subprocess.call(cmake_command, cwd="build", shell=True)
-
-def make():
-    return subprocess.call(["make",
-        "-j" + str(num_cpus()),
-        "-l" + str(2 * num_cpus()),
-        ],
-        cwd="build",
-        env=ccache_env()
-        )
-
-
-def ccache_env():
-    env = os.environ.copy()
-    env['CCACHE_DIR'] = os.getcwd() + '/.ccache'
-    return env
-
-
-def run_tests():
-    return subprocess.call(["ctest",
-                            "--output-on-failure",
-                            "-j" + str(num_cpus()),
-                            "--test-load", str(4 * num_cpus()),
-                            ],
-                            cwd="build")
-
-def main():
-    parser = optparse.OptionParser()
-    parser.add_option("--build_type", dest="build_type", default="RELEASE")
-    parser.add_option("--compiler", dest="compiler")
-    parser.add_option("--cxxflags", dest="cxxflags")
-    parser.add_option("--output_dir", dest="output_dir", default="install")
-    parser.add_option("--skiptests", dest="skiptests", action="store_true", default=False)
-
-    (options, args) = parser.parse_args()
-    # install deps for building
-    status = install_dependencies(args, "/usr/local")
-    if status:
-        return status
-    status = cmake_configure("",
-                             options.build_type,
-                             options.output_dir,
-                             options.compiler,
-                             options.cxxflags)
-    if status:
-        return status
-    status = make()
-    if status:
-        return status
-    if not options.skiptests:
-        status = run_tests()
-        if status:
-            return status
-    return 0
-
-if __name__ == "__main__":
-    sys.exit(main())
diff --git a/src/backend/gporca/concourse/xerces-c/build_xerces.py b/src/backend/gporca/concourse/xerces-c/build_xerces.py
deleted file mode 100644
index 8b49e13ac2a..00000000000
--- a/src/backend/gporca/concourse/xerces-c/build_xerces.py
+++ /dev/null
@@ -1,93 +0,0 @@
-#!/usr/bin/env python3
-
-import optparse
-import os
-import os.path
-import subprocess
-import sys
-import tarfile
-import urllib.request, urllib.error, urllib.parse
-import hashlib
-
-XERCES_SOURCE_URL = "http://archive.apache.org/dist/xerces/c/3/sources/xerces-c-3.1.2.tar.gz"
-XERCES_SOURCE_DIR = "xerces-c-3.1.2"
-
-def num_cpus():
-    # Use multiprocessing module, available in Python 2.6+
-    try:
-        import multiprocessing
-        return multiprocessing.cpu_count()
-    except (ImportError, NotImplementedError):
-        pass
-
-    # Get POSIX system config value for number of processors.
-    posix_num_cpus = os.sysconf("SC_NPROCESSORS_ONLN")
-    if posix_num_cpus != -1:
-        return posix_num_cpus
-
-    # Guess
-    return 2
-
-def get_xerces_source():
-    remote_src = urllib.request.urlopen(XERCES_SOURCE_URL)
-    local_src = open("xerces_src.tar.gz", "wb")
-    local_src.write(remote_src.read())
-    local_src.close()
-    file_hash = hashlib.sha256(open('xerces_src.tar.gz','rb').read()).hexdigest()
-    actual_hash = ""
-    with open('xerces_patch/concourse/xerces-c/xerces-c-3.1.2.tar.gz.sha256', 'r') as f:
-        actual_hash = f.read().strip()
-    if file_hash != actual_hash:
-        return 1
-    tarball = tarfile.open("xerces_src.tar.gz", "r:gz")
-    for item in tarball:
-        tarball.extract(item, ".")
-    tarball.close()
-    return 0
-
-def configure(cxx_compiler, cxxflags, cflags, output_dir):
-    os.mkdir("build")
-    environment = os.environ.copy()
-    if cxx_compiler:
-        environment["CXX"] = cxx_compiler
-    if cxxflags:
-        environment["CXXFLAGS"] = cxxflags
-    if cflags:
-        environment["CFLAGS"] = cflags
-    return subprocess.call(
-        [os.path.abspath(XERCES_SOURCE_DIR + "/configure"), "--prefix=" + os.path.abspath(output_dir)],
-        env = environment,
-        cwd = "build")
-
-def make():
-    return subprocess.call(["make", "-j" + str(num_cpus())], cwd="build")
-
-def install():
-    return subprocess.call(["make", "install"], cwd="build")
-
-def main():
-    parser = optparse.OptionParser()
-    parser.add_option("--compiler", dest="compiler")
-    parser.add_option("--cxxflags", dest="cxxflags")
-    parser.add_option("--cflags", dest="cflags")
-    parser.add_option("--output_dir", dest="output_dir", default="install")
-    (options, args) = parser.parse_args()
-    if len(args) > 0:
-        print("Unknown arguments")
-        return 1
-    status = get_xerces_source()
-    if status:
-        return status
-    status = configure(options.compiler, options.cxxflags, options.cflags, options.output_dir)
-    if status:
-        return status
-    status = make()
-    if status:
-        return status
-    status = install()
-    if status:
-        return status
-    return 0
-
-if __name__ == "__main__":
-    sys.exit(main())
diff --git a/src/backend/gporca/concourse/xerces-c/xerces-c-3.1.2.tar.gz.sha256 b/src/backend/gporca/concourse/xerces-c/xerces-c-3.1.2.tar.gz.sha256
deleted file mode 100644
index 7fbcc8000ec..00000000000
--- a/src/backend/gporca/concourse/xerces-c/xerces-c-3.1.2.tar.gz.sha256
+++ /dev/null
@@ -1 +0,0 @@
-743bd0a029bf8de56a587c270d97031e0099fe2b7142cef03e0da16e282655a0
diff --git a/src/backend/gporca/libgpdbcost/include/gpdbcost/CCostModelGPDB.h b/src/backend/gporca/libgpdbcost/include/gpdbcost/CCostModelGPDB.h
index 2b44693fa4e..7db2cdbbdd1 100644
--- a/src/backend/gporca/libgpdbcost/include/gpdbcost/CCostModelGPDB.h
+++ b/src/backend/gporca/libgpdbcost/include/gpdbcost/CCostModelGPDB.h
@@ -80,6 +80,11 @@ class CCostModelGPDB : public ICostModel
 						  const CCostModelGPDB *pcmgpdb,
 						  const SCostingInfo *pci);
 
+	// cost of parallel table scan
+	static CCost CostParallelTableScan(CMemoryPool *mp, CExpressionHandle &exprhdl,
+									   const CCostModelGPDB *pcmgpdb,
+									   const SCostingInfo *pci);
+
 	// cost of filter
 	static CCost CostFilter(CMemoryPool *mp, CExpressionHandle &exprhdl,
 							const CCostModelGPDB *pcmgpdb,
@@ -225,6 +230,10 @@ class CCostModelGPDB : public ICostModel
 								   IStatistics *&stats,
 								   CMDAccessor *md_accessor, CMemoryPool *mp);
 
+	// Helper functions for parallel cost calculation
+	static CDouble CalculateParallelEfficiency(ULONG ulWorkers);
+	static CDouble GetWorkerStartupCost(const CCostModelGPDB *pcmgpdb, ULONG ulWorkers);
+
 public:
 	// ctor
 	CCostModelGPDB(CMemoryPool *mp, ULONG ulSegments,
diff --git a/src/backend/gporca/libgpdbcost/src/CCostModelGPDB.cpp b/src/backend/gporca/libgpdbcost/src/CCostModelGPDB.cpp
index 0bf5e167469..575f6473ff0 100644
--- a/src/backend/gporca/libgpdbcost/src/CCostModelGPDB.cpp
+++ b/src/backend/gporca/libgpdbcost/src/CCostModelGPDB.cpp
@@ -12,6 +12,7 @@
 #include "gpdbcost/CCostModelGPDB.h"
 
 #include <limits>
+#include <cmath>
 
 #include "gpopt/base/CColRefSetIter.h"
 #include "gpopt/base/COptCtxt.h"
@@ -27,6 +28,7 @@
 #include "gpopt/operators/CPhysicalHashAgg.h"
 #include "gpopt/operators/CPhysicalIndexOnlyScan.h"
 #include "gpopt/operators/CPhysicalIndexScan.h"
+#include "gpopt/operators/CPhysicalParallelTableScan.h"
 #include "gpopt/operators/CPhysicalMotion.h"
 #include "gpopt/operators/CPhysicalMotionBroadcast.h"
 #include "gpopt/operators/CPhysicalPartitionSelector.h"
@@ -43,6 +45,8 @@
 using namespace gpos;
 using namespace gpdbcost;
 
+// Forward declare PostgreSQL GUC variables
+extern double parallel_setup_cost;
 
 //---------------------------------------------------------------------------
 //	@function:
@@ -2380,7 +2384,8 @@ CCostModelGPDB::CostScan(CMemoryPool *,	 // mp
 	GPOS_ASSERT(COperator::EopPhysicalTableScan == op_id ||
 				COperator::EopPhysicalDynamicTableScan == op_id ||
 				COperator::EopPhysicalForeignScan == op_id ||
-				COperator::EopPhysicalDynamicForeignScan == op_id);
+				COperator::EopPhysicalDynamicForeignScan == op_id ||
+				COperator::EopPhysicalParallelTableScan == op_id);
 
 	const CDouble dInitScan =
 		pcmgpdb->GetCostModelParams()
@@ -2402,6 +2407,7 @@ CCostModelGPDB::CostScan(CMemoryPool *,	 // mp
 		case COperator::EopPhysicalDynamicTableScan:
 		case COperator::EopPhysicalForeignScan:
 		case COperator::EopPhysicalDynamicForeignScan:
+		case COperator::EopPhysicalParallelTableScan:
 			// table scan cost considers only retrieving tuple cost,
 			// since we scan the entire table here, the cost is correlated with table rows and table width,
 			// since Scan's parent operator may be a filter that will be pushed into Scan node in GPDB plan,
@@ -2416,6 +2422,120 @@ CCostModelGPDB::CostScan(CMemoryPool *,	 // mp
 }
 
 
+//---------------------------------------------------------------------------
+//	@function:
+//		CCostModelGPDB::CostParallelTableScan
+//
+//	@doc:
+//		Cost of parallel table scan
+//
+//---------------------------------------------------------------------------
+CCost
+CCostModelGPDB::CostParallelTableScan(CMemoryPool *mp,
+									  CExpressionHandle &exprhdl,
+									  const CCostModelGPDB *pcmgpdb,
+									  const SCostingInfo *pci)
+{
+	GPOS_ASSERT(nullptr != pcmgpdb);
+	GPOS_ASSERT(nullptr != pci);
+
+	COperator *pop = exprhdl.Pop();
+	GPOS_ASSERT(COperator::EopPhysicalParallelTableScan == pop->Eopid());
+
+	// Read the worker count from the parallel table scan operator
+	CPhysicalParallelTableScan *popParallelScan =
+		CPhysicalParallelTableScan::PopConvert(pop);
+	ULONG ulWorkers = popParallelScan->UlParallelWorkers();
+
+	// With at most one worker there is no parallelism: use the regular scan cost
+	if (ulWorkers <= 1)
+	{
+		return CostScan(mp, exprhdl, pcmgpdb, pci);
+	}
+
+	// Look up the same cost parameters and base-table width that feed the formula below
+	const CDouble dInitScan =
+		pcmgpdb->GetCostModelParams()
+			->PcpLookup(CCostModelParamsGPDB::EcpInitScanFactor)
+			->Get();
+	const CDouble dTableWidth =
+		CPhysicalScan::PopConvert(pop)->PstatsBaseTable()->Width();
+	const CDouble dTableScanCostUnit =
+		pcmgpdb->GetCostModelParams()
+			->PcpLookup(CCostModelParamsGPDB::EcpTableScanCostUnit)
+			->Get();
+
+	// Base (serial) scan cost = init factor + rows * width * per-unit scan cost
+	CDouble dBaseScanCost = dInitScan + pci->Rows() * dTableWidth * dTableScanCostUnit;
+
+	// Parallel efficiency factor for this worker count (below 1 for more than one worker)
+	CDouble dParallelEfficiency = CalculateParallelEfficiency(ulWorkers);
+
+	// Parallel scan cost = base cost / (workers * efficiency)
+	CDouble dParallelScanCost = dBaseScanCost / (ulWorkers * dParallelEfficiency);
+
+	// Worker startup cost; charged once, outside the per-rebind multiplication below
+	CDouble dWorkerStartupCost = GetWorkerStartupCost(pcmgpdb, ulWorkers);
+
+	// Total cost = rebinds * per-scan parallel cost + one-time startup cost
+	return CCost(pci->NumRebinds() * dParallelScanCost + dWorkerStartupCost);
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CCostModelGPDB::CalculateParallelEfficiency
+//
+//	@doc:
+//		Calculate parallel efficiency factor (0-1) based on worker count
+//
+//---------------------------------------------------------------------------
+CDouble
+CCostModelGPDB::CalculateParallelEfficiency(ULONG ulWorkers)
+{
+	if (ulWorkers <= 1)
+	{
+		return 1.0;
+	}
+
+	// Efficiency shrinks as log2(workers) grows, so extra workers give diminishing returns
+	// Formula: efficiency = 1 / (1 + 0.1 * log2(workers))
+	// This gives approximately: 2 workers = 0.91, 4 workers = 0.83, 8 workers = 0.77
+	double dLogWorkers = std::log2(static_cast<double>(ulWorkers));
+	return CDouble(1.0 / (1.0 + 0.1 * dLogWorkers));
+}
+
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CCostModelGPDB::GetWorkerStartupCost
+//
+//	@doc:
+//		Get the cost of starting up parallel workers
+//
+//---------------------------------------------------------------------------
+CDouble
+CCostModelGPDB::GetWorkerStartupCost(const CCostModelGPDB * /* pcmgpdb */, ULONG ulWorkers)
+{
+	if (ulWorkers <= 1)
+	{
+		return 0.0;
+	}
+
+	// ORCA's cost units are much smaller than PostgreSQL's cost model
+	// PostgreSQL's parallel_setup_cost default is 1000, but ORCA's costs are:
+	//   - InitScanFactor: 431.0
+	//   - HJHashTableInitCostFactor: 500.0
+	//   - DefaultCost: 100.0
+	//
+	// Use a conversion factor to map parallel_setup_cost to ORCA's scale.
+	// With default parallel_setup_cost=1000, this gives 1.0, which is
+	// small compared to InitScanFactor (431.0) - about 0.2% overhead
+	const double POSTGRES_TO_ORCA_COST_CONVERSION = 0.001;
+
+	return CDouble(parallel_setup_cost * POSTGRES_TO_ORCA_COST_CONVERSION);
+}
+
+
 //---------------------------------------------------------------------------
 //	@function:
 //		CCostModelGPDB::CostFilter
@@ -2489,11 +2609,15 @@ CCostModelGPDB::Cost(
 		case COperator::EopPhysicalDynamicTableScan:
 		case COperator::EopPhysicalForeignScan:
 		case COperator::EopPhysicalDynamicForeignScan:
-
 		{
 			return CostScan(m_mp, exprhdl, this, pci);
 		}
 
+		case COperator::EopPhysicalParallelTableScan:
+		{
+			return CostParallelTableScan(m_mp, exprhdl, this, pci);
+		}
+
 		case COperator::EopPhysicalFilter:
 		{
 			return CostFilter(m_mp, exprhdl, this, pci);
diff --git a/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpec.h b/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpec.h
index d3b47b95f80..9f3b74bd76f 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpec.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpec.h
@@ -71,6 +71,7 @@ class CDistributionSpec : public CPropSpec
 		EdtStrictSingleton,	 // data is on a single segment or the master (derived only, only compatible with other singleton distributions)
 		EdtRandom,			 // data is randomly distributed across all segments
 		EdtStrictRandom,  // same as random, used to force multiple slices for parallel union all.
+		EdtWorkerRandom,  // data is randomly distributed among parallel workers within segments
 		EdtRouted,	// data is routed to a segment explicitly specified in the tuple,
 		EdtUniversal,  // data is available everywhere (derived only)
 		EdtNonSingleton,  // data can have any distribution except singleton (required only)
diff --git a/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpecWorkerRandom.h b/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpecWorkerRandom.h
new file mode 100644
index 00000000000..f026f00e247
--- /dev/null
+++ b/src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpecWorkerRandom.h
@@ -0,0 +1,139 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CDistributionSpecWorkerRandom.h
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/include/gpopt/base/CDistributionSpecWorkerRandom.h
+ *
+ *-------------------------------------------------------------------------
+ */
+#ifndef GPOPT_CDistributionSpecWorkerRandom_H
+#define GPOPT_CDistributionSpecWorkerRandom_H
+
+#include "gpos/base.h"
+
+#include "gpopt/base/CDistributionSpecRandom.h"
+
+namespace gpopt
+{
+using namespace gpos;
+
+//---------------------------------------------------------------------------
+//	@class:
+//		CDistributionSpecWorkerRandom
+//
+//	@doc:
+//		Class for representing worker-level random distribution.
+//		This class provides a specialized implementation for parallel
+//		worker execution with explicit worker count management.
+//
+//---------------------------------------------------------------------------
+class CDistributionSpecWorkerRandom : public CDistributionSpecRandom
+{
+private:
+	// number of parallel workers the data is spread across
+	ULONG m_ulWorkers;
+
+	// base segment-level distribution (usually random); this object holds a reference
+	CDistributionSpec *m_pdsSegmentBase;
+
+	// not copyable
+	CDistributionSpecWorkerRandom(const CDistributionSpecWorkerRandom &) = delete;
+
+public:
+	// ctor; a non-null base is expected -- PdsCreateWorkerRandom supplies a default one
+	CDistributionSpecWorkerRandom(ULONG ulWorkers, CDistributionSpec *pdsSegmentBase = nullptr);
+
+	// dtor; gives up the reference on the base distribution
+	~CDistributionSpecWorkerRandom() override;
+
+	// distribution type accessor
+	EDistributionType
+	Edt() const override
+	{
+		return CDistributionSpec::EdtWorkerRandom;
+	}
+
+	// distribution identifier, also used as the prefix when printing
+	const CHAR *
+	SzId() const override
+	{
+		return "WORKER_RANDOM";
+	}
+
+	// number of parallel workers
+	ULONG
+	UlWorkers() const
+	{
+		return m_ulWorkers;
+	}
+
+	// base segment distribution; no reference is added for the caller
+	CDistributionSpec *
+	PdsSegmentBase() const
+	{
+		return m_pdsSegmentBase;
+	}
+
+	// does this distribution match the given one
+	BOOL Matches(const CDistributionSpec *pds) const override;
+
+	// does this distribution satisfy the given one
+	BOOL FSatisfies(const CDistributionSpec *pds) const override;
+
+	// append enforcers to dynamic array for the given plan properties
+	void AppendEnforcers(CMemoryPool *mp, CExpressionHandle &exprhdl,
+						 CReqdPropPlan *prpp, CExpressionArray *pdrgpexpr,
+						 CExpression *pexpr) override;
+
+	// print
+	IOstream &OsPrint(IOstream &os) const override;
+
+	// factory; a null pdsBase is replaced by a default random distribution
+	static CDistributionSpecWorkerRandom *PdsCreateWorkerRandom(
+		CMemoryPool *mp, ULONG ulWorkers, CDistributionSpec *pdsBase = nullptr);
+
+	// checked downcast from a generic distribution spec
+	static CDistributionSpecWorkerRandom *
+	PdsConvert(CDistributionSpec *pds)
+	{
+		GPOS_ASSERT(nullptr != pds);
+		GPOS_ASSERT(EdtWorkerRandom == pds->Edt());
+
+		return dynamic_cast<CDistributionSpecWorkerRandom *>(pds);
+	}
+
+	// checked downcast from a generic distribution spec: const argument
+	static const CDistributionSpecWorkerRandom *
+	PdsConvert(const CDistributionSpec *pds)
+	{
+		GPOS_ASSERT(nullptr != pds);
+		GPOS_ASSERT(EdtWorkerRandom == pds->Edt());
+
+		return dynamic_cast<const CDistributionSpecWorkerRandom *>(pds);
+	}
+
+};	// class CDistributionSpecWorkerRandom
+
+}  // namespace gpopt
+
+#endif	// !GPOPT_CDistributionSpecWorkerRandom_H
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/include/gpopt/base/CRewindabilitySpec.h b/src/backend/gporca/libgpopt/include/gpopt/base/CRewindabilitySpec.h
index bd2dea7eec1..2959a678301 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/base/CRewindabilitySpec.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/base/CRewindabilitySpec.h
@@ -108,6 +108,7 @@ class CRewindabilitySpec : public CPropSpec
 		EmhtSentinel
 	};
 
+
 private:
 	// rewindability support
 	ERewindabilityType m_rewindability;
diff --git a/src/backend/gporca/libgpopt/include/gpopt/base/CUtils.h b/src/backend/gporca/libgpopt/include/gpopt/base/CUtils.h
index 1e873e14847..0aded041e00 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/base/CUtils.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/base/CUtils.h
@@ -1026,6 +1026,9 @@ class CUtils
 	static CTableDescriptorHashSet *RemoveDuplicateMdids(
 		CMemoryPool *mp, CTableDescriptorHashSet *tabdescs);
 
+	static BOOL FHasCrossSliceReplicatedCTEConsumer(CMemoryPool *mp,
+													CExpression *pexpr);
+
 	static CExpression *ReplaceColrefWithProjectExpr(CMemoryPool *mp,
 													 CExpression *pexpr,
 													 CColRef *pcolref,
diff --git a/src/backend/gporca/libgpopt/include/gpopt/operators/COperator.h b/src/backend/gporca/libgpopt/include/gpopt/operators/COperator.h
index 657e3082ef7..5d10a1cee99 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/operators/COperator.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/operators/COperator.h
@@ -188,6 +188,7 @@ class COperator : public CRefCount, public DbgPrintMixin<COperator>
 		EopScalarFieldSelect,
 
 		EopPhysicalTableScan,
+		EopPhysicalParallelTableScan,
 		EopPhysicalForeignScan,
 		EopPhysicalIndexScan,
 		EopPhysicalIndexOnlyScan,
diff --git a/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalParallelTableScan.h b/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalParallelTableScan.h
new file mode 100644
index 00000000000..2ebb916d4f3
--- /dev/null
+++ b/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalParallelTableScan.h
@@ -0,0 +1,140 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CPhysicalParallelTableScan.h
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalParallelTableScan.h
+ *
+ *-------------------------------------------------------------------------
+ */
+#ifndef GPOPT_CPhysicalParallelTableScan_H
+#define GPOPT_CPhysicalParallelTableScan_H
+
+#include "gpos/base.h"
+
+#include "gpopt/operators/CPhysicalTableScan.h"
+
+namespace gpopt
+{
+//---------------------------------------------------------------------------
+//	@class:
+//		CPhysicalParallelTableScan
+//
+//	@doc:
+//		Parallel table scan operator
+//
+//---------------------------------------------------------------------------
+class CPhysicalParallelTableScan : public CPhysicalTableScan
+{
+private:
+	// number of parallel workers
+	ULONG m_ulParallelWorkers;
+
+	// worker-level distribution spec
+	CDistributionSpec *m_pdsWorkerDistribution;
+
+	// not copyable
+	CPhysicalParallelTableScan(const CPhysicalParallelTableScan &) = delete;
+
+public:
+	// ctors
+	explicit CPhysicalParallelTableScan(CMemoryPool *mp);
+	CPhysicalParallelTableScan(CMemoryPool *mp, const CName *pnameAlias,
+							   CTableDescriptor *ptabdesc,
+							   CColRefArray *pdrgpcrOutput,
+							   ULONG ulParallelWorkers);
+
+	// dtor
+	~CPhysicalParallelTableScan() override;
+
+	// operator id accessor
+	EOperatorId
+	Eopid() const override
+	{
+		return EopPhysicalParallelTableScan;
+	}
+
+	// return a string for operator name
+	const CHAR *
+	SzId() const override
+	{
+		return "CPhysicalParallelTableScan";
+	}
+
+	// number of parallel workers requested for this scan
+	ULONG UlParallelWorkers() const
+	{
+		return m_ulParallelWorkers;
+	}
+
+	// operator specific hash function
+	ULONG HashValue() const override;
+
+	// match function
+	BOOL Matches(COperator *) const override;
+
+	// debug print
+	IOstream &OsPrint(IOstream &) const override;
+
+	// checked downcast from a generic operator
+	static CPhysicalParallelTableScan *
+	PopConvert(COperator *pop)
+	{
+		GPOS_ASSERT(nullptr != pop);
+		GPOS_ASSERT(EopPhysicalParallelTableScan == pop->Eopid());
+
+		return dynamic_cast<CPhysicalParallelTableScan *>(pop);
+	}
+
+	CRewindabilitySpec *
+	PrsDerive(CMemoryPool *mp,
+			  CExpressionHandle &  // exprhdl
+	) const override
+	{
+		return GPOS_NEW(mp)
+			CRewindabilitySpec(CRewindabilitySpec::ErtNone,
+							   CRewindabilitySpec::EmhtNoMotion);
+	}
+
+	// derive distribution
+	CDistributionSpec *PdsDerive(CMemoryPool *mp, CExpressionHandle &exprhdl) const override;
+
+	// return distribution property enforcing type for this operator
+	CEnfdProp::EPropEnforcingType EpetDistribution(
+		CExpressionHandle &exprhdl,
+		const CEnfdDistribution *ped) const override;
+
+	// return rewindability property enforcing type for this operator
+	CEnfdProp::EPropEnforcingType EpetRewindability(
+		CExpressionHandle &exprhdl,
+		const CEnfdRewindability *per) const override;
+
+	// check if the optimization context is valid
+	// Reject if parent requires REWINDABLE (e.g., for NL Join inner child)
+	BOOL FValidContext(CMemoryPool *mp, COptimizationContext *poc,
+					   COptimizationContextArray *pdrgpocChild) const override;
+
+};	// class CPhysicalParallelTableScan
+
+}  // namespace gpopt
+
+#endif	// !GPOPT_CPhysicalParallelTableScan_H
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalTableScan.h b/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalTableScan.h
index ace1005d67a..d34f0150b55 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalTableScan.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/operators/CPhysicalTableScan.h
@@ -71,7 +71,8 @@ class CPhysicalTableScan : public CPhysicalScan
 	{
 		GPOS_ASSERT(nullptr != pop);
 		GPOS_ASSERT(EopPhysicalTableScan == pop->Eopid() ||
-					EopPhysicalForeignScan == pop->Eopid());
+					EopPhysicalForeignScan == pop->Eopid() ||
+					EopPhysicalParallelTableScan == pop->Eopid());
 
 		return dynamic_cast<CPhysicalTableScan *>(pop);
 	}
diff --git a/src/backend/gporca/libgpopt/include/gpopt/optimizer/COptimizerConfig.h b/src/backend/gporca/libgpopt/include/gpopt/optimizer/COptimizerConfig.h
index 159ddafbed7..eeee3932b3e 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/optimizer/COptimizerConfig.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/optimizer/COptimizerConfig.h
@@ -69,11 +69,15 @@ class COptimizerConfig : public CRefCount
 	// default window oids
 	CWindowOids *m_window_oids;
 
+	// should generate parallel plans ?
+	BOOL m_create_parallel_plan;
+
 public:
 	// ctor
 	COptimizerConfig(CEnumeratorConfig *pec, CStatisticsConfig *stats_config,
 					 CCTEConfig *pcteconf, ICostModel *pcm, CHint *phint,
-					 CPlanHint *pplanhint, CWindowOids *pdefoidsGPDB);
+					 CPlanHint *pplanhint, CWindowOids *pdefoidsGPDB,
+					 BOOL enable_parallel_plans = false);
 
 	// dtor
 	~COptimizerConfig() override;
@@ -127,6 +131,13 @@ class COptimizerConfig : public CRefCount
 		return m_plan_hint;
 	}
 
+	// parallel plans setting
+	BOOL
+	CreateParallelPlan() const
+	{
+		return m_create_parallel_plan;
+	}
+
 	// generate default optimizer configurations
 	static COptimizerConfig *PoconfDefault(CMemoryPool *mp);
 
diff --git a/src/backend/gporca/libgpopt/include/gpopt/search/CGroup.h b/src/backend/gporca/libgpopt/include/gpopt/search/CGroup.h
index 0b94e9df7e7..eaeaf22024f 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/search/CGroup.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/search/CGroup.h
@@ -38,6 +38,7 @@ class CDrvdProp;
 class CDrvdPropCtxtPlan;
 class CReqdPropRelational;
 class CExpression;
+class CMemo;
 
 // type definitions
 // array of groups
@@ -160,6 +161,9 @@ class CGroup : public CRefCount, public DbgPrintMixin<CGroup>
 	// memory pool
 	CMemoryPool *m_mp;
 
+	// containing memo
+	CMemo *m_pmemo;
+
 	// id is used when printing memo contents
 	ULONG m_id;
 
@@ -257,6 +261,9 @@ class CGroup : public CRefCount, public DbgPrintMixin<CGroup>
 	// setter of group state
 	void SetState(EState estNewState);
 
+	// setter of containing memo
+	void SetMemo(CMemo *pmemo);
+
 	// set hash join keys
 	void SetJoinKeys(CExpressionArray *pdrgpexprOuter,
 					 CExpressionArray *pdrgpexprInner,
@@ -338,6 +345,13 @@ class CGroup : public CRefCount, public DbgPrintMixin<CGroup>
 		return m_id;
 	}
 
+	// containing memo accessor
+	CMemo *
+	Pmemo() const
+	{
+		return m_pmemo;
+	}
+
 	// group properties accessor
 	CDrvdProp *
 	Pdp() const
diff --git a/src/backend/gporca/libgpopt/include/gpopt/search/CGroupProxy.h b/src/backend/gporca/libgpopt/include/gpopt/search/CGroupProxy.h
index 61303f39ef7..1e77f0fbcab 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/search/CGroupProxy.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/search/CGroupProxy.h
@@ -23,6 +23,7 @@ using namespace gpos;
 class CGroupExpression;
 class CDrvdProp;
 class COptimizationContext;
+class CMemo;
 
 //---------------------------------------------------------------------------
 //	@class:
@@ -63,6 +64,13 @@ class CGroupProxy
 		m_pgroup->SetState(estNewState);
 	}
 
+	// set containing memo
+	void
+	SetMemo(CMemo *pmemo)
+	{
+		m_pgroup->SetMemo(pmemo);
+	}
+
 	// set hash join keys
 	void
 	SetJoinKeys(CExpressionArray *pdrgpexprOuter,
diff --git a/src/backend/gporca/libgpopt/include/gpopt/xforms/CXform.h b/src/backend/gporca/libgpopt/include/gpopt/xforms/CXform.h
index 225371097c5..d0fca8219ac 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/xforms/CXform.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/xforms/CXform.h
@@ -69,6 +69,7 @@ class CXform : public CRefCount, public DbgPrintMixin<CXform>
 		ExfExpandNAryJoinMinCard,
 		ExfExpandNAryJoinDP,
 		ExfGet2TableScan,
+		ExfGet2ParallelTableScan,
 		ExfIndexGet2IndexScan,
 		ExfDynamicGet2DynamicTableScan,
 		ExfDynamicIndexGet2DynamicIndexScan,
diff --git a/src/backend/gporca/libgpopt/include/gpopt/xforms/CXformGet2ParallelTableScan.h b/src/backend/gporca/libgpopt/include/gpopt/xforms/CXformGet2ParallelTableScan.h
new file mode 100644
index 00000000000..99c8d4863d4
--- /dev/null
+++ b/src/backend/gporca/libgpopt/include/gpopt/xforms/CXformGet2ParallelTableScan.h
@@ -0,0 +1,88 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CXformGet2ParallelTableScan.h
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/include/gpopt/xforms/CXformGet2ParallelTableScan.h
+ *
+ *-------------------------------------------------------------------------
+ */
+#ifndef GPOPT_CXformGet2ParallelTableScan_H
+#define GPOPT_CXformGet2ParallelTableScan_H
+
+#include "gpos/base.h"
+
+#include "gpopt/xforms/CXformImplementation.h"
+
+namespace gpopt
+{
+using namespace gpos;
+
+//---------------------------------------------------------------------------
+//	@class:
+//		CXformGet2ParallelTableScan
+//
+//	@doc:
+//		Transform Get to Parallel TableScan using GUC enable_parallel
+//
+//---------------------------------------------------------------------------
+class CXformGet2ParallelTableScan : public CXformImplementation
+{
+private:
+	// whether the memo holds logical operators that rule out parallel execution
+	static BOOL FHasParallelIncompatibleOps(CExpressionHandle &exprhdl);
+
+public:
+	CXformGet2ParallelTableScan(const CXformGet2ParallelTableScan &) = delete;
+
+	// ctor
+	explicit CXformGet2ParallelTableScan(CMemoryPool *);
+
+	// dtor
+	~CXformGet2ParallelTableScan() override = default;
+
+	// xform id accessor
+	EXformId
+	Exfid() const override
+	{
+		return ExfGet2ParallelTableScan;
+	}
+
+	// return a string for xform name
+	const CHAR *
+	SzId() const override
+	{
+		return "CXformGet2ParallelTableScan";
+	}
+
+	// compute xform promise for a given expression handle
+	EXformPromise Exfp(CExpressionHandle &exprhdl) const override;
+
+	// apply the transformation to pexpr, adding any alternatives to pxfres
+	void Transform(CXformContext *pxfctxt, CXformResult *pxfres,
+				   CExpression *pexpr) const override;
+
+};	// class CXformGet2ParallelTableScan
+
+}  // namespace gpopt
+
+#endif	// !GPOPT_CXformGet2ParallelTableScan_H
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/include/gpopt/xforms/xforms.h b/src/backend/gporca/libgpopt/include/gpopt/xforms/xforms.h
index fb5ba6b1e3c..0ee9beb2eb7 100644
--- a/src/backend/gporca/libgpopt/include/gpopt/xforms/xforms.h
+++ b/src/backend/gporca/libgpopt/include/gpopt/xforms/xforms.h
@@ -52,6 +52,7 @@
 #include "gpopt/xforms/CXformGbAggDedup2StreamAggDedup.h"
 #include "gpopt/xforms/CXformGbAggWithMDQA2Join.h"
 #include "gpopt/xforms/CXformGet2TableScan.h"
+#include "gpopt/xforms/CXformGet2ParallelTableScan.h"
 #include "gpopt/xforms/CXformImplementAssert.h"
 #include "gpopt/xforms/CXformImplementBitmapTableGet.h"
 #include "gpopt/xforms/CXformImplementCTEConsumer.h"
diff --git a/src/backend/gporca/libgpopt/src/base/CDistributionSpecWorkerRandom.cpp b/src/backend/gporca/libgpopt/src/base/CDistributionSpecWorkerRandom.cpp
new file mode 100644
index 00000000000..a5e9e86b02d
--- /dev/null
+++ b/src/backend/gporca/libgpopt/src/base/CDistributionSpecWorkerRandom.cpp
@@ -0,0 +1,330 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CDistributionSpecWorkerRandom.cpp
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/src/base/CDistributionSpecWorkerRandom.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "gpopt/base/CDistributionSpecWorkerRandom.h"
+
+#include "gpopt/base/CColRefSet.h"
+#include "gpopt/base/CDistributionSpecHashed.h"
+#include "gpopt/base/CDistributionSpecStrictRandom.h"
+#include "gpopt/base/COptCtxt.h"
+#include "gpopt/base/CUtils.h"
+#include "gpopt/operators/CExpressionHandle.h"
+#include "gpopt/operators/CPhysicalMotionHashDistribute.h"
+#include "gpopt/operators/CPhysicalMotionRandom.h"
+#include "naucrates/traceflags/traceflags.h"
+
+using namespace gpopt;
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::CDistributionSpecWorkerRandom
+//
+//	@doc:
+//		Ctor; takes its own reference on pdsSegmentBase when it is non-null.
+//		A null base trips the assert in debug builds; prefer PdsCreateWorkerRandom
+//
+//---------------------------------------------------------------------------
+CDistributionSpecWorkerRandom::CDistributionSpecWorkerRandom(ULONG ulWorkers, CDistributionSpec *pdsSegmentBase)
+	: m_ulWorkers(ulWorkers), m_pdsSegmentBase(pdsSegmentBase)
+{
+	GPOS_ASSERT(ulWorkers > 0);
+	GPOS_ASSERT(nullptr != pdsSegmentBase &&
+				"pdsSegmentBase must be non-null. Use PdsCreateWorkerRandom factory method.");
+	if (nullptr != m_pdsSegmentBase)
+	{
+		m_pdsSegmentBase->AddRef();
+	}
+
+	if (COptCtxt::PoctxtFromTLS()->FDMLQuery())
+	{
+		// DML queries: mark duplicate sensitive to enforce Hash-Distribution of Const Tables
+		MarkDuplicateSensitive();
+	}
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::~CDistributionSpecWorkerRandom
+//
+//	@doc:
+//		Dtor; gives up the reference held on the base segment distribution
+//
+//---------------------------------------------------------------------------
+CDistributionSpecWorkerRandom::~CDistributionSpecWorkerRandom()
+{
+	CRefCount::SafeRelease(m_pdsSegmentBase);
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::PdsCreateWorkerRandom
+//
+//	@doc:
+//		Factory for worker-level random distribution; a null pdsBase defaults to a random spec allocated from mp
+//
+//---------------------------------------------------------------------------
+CDistributionSpecWorkerRandom *
+CDistributionSpecWorkerRandom::PdsCreateWorkerRandom(CMemoryPool *mp, ULONG ulWorkers, CDistributionSpec *pdsBase)
+{
+	GPOS_ASSERT(nullptr != mp);
+	GPOS_ASSERT(ulWorkers > 0);
+
+	const BOOL fOwnsBase = (nullptr == pdsBase);
+	CDistributionSpec *pdsSegmentBase = fOwnsBase ? GPOS_NEW(mp) CDistributionSpecRandom() : pdsBase;
+	CDistributionSpecWorkerRandom *pdsWorkerRandom = GPOS_NEW(mp) CDistributionSpecWorkerRandom(ulWorkers, pdsSegmentBase);
+	if (fOwnsBase)
+	{
+		// the ctor took its own reference; drop the creation reference so the default base is not leaked
+		pdsSegmentBase->Release();
+	}
+	return pdsWorkerRandom;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::Matches
+//
+//	@doc:
+//		Match function
+//
+//---------------------------------------------------------------------------
+BOOL
+CDistributionSpecWorkerRandom::Matches(const CDistributionSpec *pds) const
+{
+	if (CDistributionSpec::EdtWorkerRandom != pds->Edt())
+	{
+		return false;
+	}
+	const CDistributionSpecWorkerRandom *pdsOther = CDistributionSpecWorkerRandom::PdsConvert(pds);
+	const CDistributionSpec *pdsOtherBase = pdsOther->m_pdsSegmentBase;
+
+	// worker count and duplicate sensitivity must agree; the segment bases
+	// must either both be absent or match each other
+	return m_ulWorkers == pdsOther->m_ulWorkers &&
+		   IsDuplicateSensitive() == pdsOther->IsDuplicateSensitive() &&
+		   ((nullptr == m_pdsSegmentBase || nullptr == pdsOtherBase)
+				? m_pdsSegmentBase == pdsOtherBase
+				: m_pdsSegmentBase->Matches(pdsOtherBase));
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::FSatisfies
+//
+//	@doc:
+//		Check if this distribution spec satisfies the given one
+//
+//---------------------------------------------------------------------------
+BOOL
+CDistributionSpecWorkerRandom::FSatisfies(const CDistributionSpec *pds) const
+{
+	if (Matches(pds))
+	{
+		return true;
+	}
+
+	switch (pds->Edt())
+	{
+		case EdtWorkerRandom:
+		{
+			// another worker-level spec: same worker count, compatible segment
+			// bases (a missing base on either side is accepted), and a required
+			// duplicate sensitivity must be provided by this spec
+			const CDistributionSpecWorkerRandom *pdsOther =
+				CDistributionSpecWorkerRandom::PdsConvert(pds);
+			const CDistributionSpec *pdsOtherBase = pdsOther->m_pdsSegmentBase;
+			return m_ulWorkers == pdsOther->m_ulWorkers &&
+				   (nullptr == m_pdsSegmentBase || nullptr == pdsOtherBase ||
+					m_pdsSegmentBase->FSatisfies(pdsOtherBase)) &&
+				   (IsDuplicateSensitive() || !pdsOther->IsDuplicateSensitive());
+		}
+		case EdtAny:
+		case EdtNonSingleton:
+		case EdtNonReplicated:
+			return true;
+		default:
+			// includes EdtRandom: segment-level random is not satisfied without a Motion
+			return false;
+	}
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::AppendEnforcers
+//
+//	@doc:
+//		Append a Motion enforcing the required distribution to pdrgpexpr, if one can be built
+//
+//---------------------------------------------------------------------------
+void
+CDistributionSpecWorkerRandom::AppendEnforcers(CMemoryPool *mp,
+											   CExpressionHandle &exprhdl,
+											   CReqdPropPlan *prpp,
+											   CExpressionArray *pdrgpexpr,
+											   CExpression *pexpr)
+{
+	GPOS_ASSERT(nullptr != mp);
+	GPOS_ASSERT(nullptr != prpp);
+	GPOS_ASSERT(nullptr != pdrgpexpr);
+	GPOS_ASSERT(nullptr != pexpr);
+	GPOS_ASSERT(!GPOS_FTRACE(EopttraceDisableMotions));
+	GPOS_ASSERT(
+		this == prpp->Ped()->PdsRequired() &&
+		"required plan properties don't match enforced distribution spec");
+
+	// required spec; per the assert above this is expected to be the current object
+	CDistributionSpec *pdsRequired = prpp->Ped()->PdsRequired();
+	GPOS_ASSERT(nullptr != pdsRequired);
+
+	// Get child's distribution for duplicate hazard checking
+	CDistributionSpec *expr_dist_spec =
+		CDrvdPropPlan::Pdpplan(exprhdl.Pdp())->Pds();
+	BOOL fDuplicateHazard = CUtils::FDuplicateHazardDistributionSpec(expr_dist_spec);
+
+	pexpr->AddRef();
+	CExpression *pexprMotion = nullptr;
+
+	// Generate appropriate motion based on required distribution type
+	switch (pdsRequired->Edt())
+	{
+		case CDistributionSpec::EdtHashed:
+		{
+			// Required: Hashed distribution -> Generate HashDistribute Motion
+			if (GPOS_FTRACE(EopttraceDisableMotionHashDistribute))
+			{
+				// Hash redistribute Motion is disabled, cannot satisfy requirement
+				pexpr->Release();
+				return;
+			}
+
+			CDistributionSpecHashed *pdsHashedRequired =
+				CDistributionSpecHashed::PdsConvert(pdsRequired);
+			pdsHashedRequired->AddRef();
+
+			if (fDuplicateHazard)
+			{
+				pdsHashedRequired->MarkDuplicateSensitive();
+			}
+
+			pexprMotion = GPOS_NEW(mp) CExpression(
+				mp, GPOS_NEW(mp) CPhysicalMotionHashDistribute(mp, pdsHashedRequired), pexpr);
+			break;
+		}
+
+		case CDistributionSpec::EdtRandom:
+		{
+			// Required: Random distribution (segment-level, no worker parallelism)
+			// Need to convert WorkerRandom to plain Random
+			if (GPOS_FTRACE(EopttraceDisableMotionRandom))
+			{
+				// Random Motion is disabled
+				pexpr->Release();
+				return;
+			}
+
+			// Create a Random distribution spec (not WorkerRandom) as the Motion target
+			// This converts worker-level parallelism to segment-level distribution
+			CDistributionSpecRandom *random_dist_spec = nullptr;
+
+			if (fDuplicateHazard)
+			{
+				random_dist_spec = GPOS_NEW(mp) CDistributionSpecRandom();
+				random_dist_spec->MarkDuplicateSensitive();
+			}
+			else
+			{
+				// Use StrictRandom for actual redistribution motion
+				random_dist_spec = GPOS_NEW(mp) CDistributionSpecStrictRandom();
+			}
+
+			pexprMotion = GPOS_NEW(mp) CExpression(
+				mp, GPOS_NEW(mp) CPhysicalMotionRandom(mp, random_dist_spec), pexpr);
+			break;
+		}
+		case CDistributionSpec::EdtWorkerRandom:
+		{
+			// Required: WorkerRandom distribution -> Generate Random Motion, unless Random Motion is disabled
+			if (GPOS_FTRACE(EopttraceDisableMotionRandom))
+			{
+				pexpr->Release();
+				return;
+			}
+
+			// the new spec takes its own reference on the base, so the creation reference is dropped here
+			CDistributionSpec *pdsBase = GPOS_NEW(mp) CDistributionSpecRandom();
+			CDistributionSpecWorkerRandom *random_dist_spec = PdsCreateWorkerRandom(mp, m_ulWorkers, pdsBase);
+			pdsBase->Release();
+			if (fDuplicateHazard)
+			{
+				random_dist_spec->MarkDuplicateSensitive();
+			}
+
+			pexprMotion = GPOS_NEW(mp) CExpression(
+				mp, GPOS_NEW(mp) CPhysicalMotionRandom(mp, random_dist_spec), pexpr);
+			break;
+		}
+
+		default:
+		{
+			// Fallback: cannot generate appropriate motion
+			pexpr->Release();
+			return;
+		}
+	}
+
+	// Add the generated motion to the enforcer array
+	if (nullptr != pexprMotion)
+	{
+		pdrgpexpr->Append(pexprMotion);
+	}
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDistributionSpecWorkerRandom::OsPrint
+//
+//	@doc:
+//		Print function
+//
+//---------------------------------------------------------------------------
+IOstream &
+CDistributionSpecWorkerRandom::OsPrint(IOstream &os) const
+{
+	// prints the spec id and worker count, followed by the base
+	// distribution when one is set
+	os << SzId() << "[workers:" << m_ulWorkers << "]";
+	if (nullptr != m_pdsSegmentBase)
+	{
+		os << " base:";
+		m_pdsSegmentBase->OsPrint(os);
+	}
+
+	// the duplicate-sensitivity marker is appended last
+	return IsDuplicateSensitive() ? (os << " (duplicate sensitive)") : os;
+}
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/src/base/CUtils.cpp b/src/backend/gporca/libgpopt/src/base/CUtils.cpp
index b5f847b817a..4776c602fcd 100644
--- a/src/backend/gporca/libgpopt/src/base/CUtils.cpp
+++ b/src/backend/gporca/libgpopt/src/base/CUtils.cpp
@@ -978,6 +978,130 @@ CUtils::FHasCTEAnchor(CExpression *pexpr)
 	return false;
 }
 
+// Replicated-like covers StrictReplicated, TaintedReplicated and Universal.
+static BOOL
+FReplicatedLikeDistribution(CDistributionSpec::EDistributionType edt)
+{
+	const BOOL fReplicated = (CDistributionSpec::EdtStrictReplicated == edt ||
+							  CDistributionSpec::EdtTaintedReplicated == edt);
+	return fReplicated || CDistributionSpec::EdtUniversal == edt;
+}
+
+struct SCTEInfo
+{
+	ULONG cteId;	// CTE id taken from the Producer/Consumer operator
+	ULONG sliceId;	// slice the operator was found in during the tree walk
+
+	SCTEInfo(ULONG cte_id, ULONG slice_id) : cteId(cte_id), sliceId(slice_id)
+	{
+	}
+};
+
+typedef CDynamicPtrArray<SCTEInfo, CleanupDelete<SCTEInfo> > CTEInfoArray;
+
+// Recursively visit a physical tree and note, per CTE id, the slice of
+// each replicated-like CTE Producer and of each CTE Consumer. A Motion
+// opens a new slice for every non-scalar child it has -- the same
+// motId-stack idea as in apply_shareinput_xslice.
+static void
+CollectCTESlices(CMemoryPool *mp, CExpression *pexpr, ULONG curSlice,
+				 ULONG *pNextSlice, CTEInfoArray *prodInfos,
+				 CTEInfoArray *consInfos)
+{
+	GPOS_CHECK_STACK_SIZE;
+	GPOS_ASSERT(nullptr != pexpr);
+
+	COperator *popNode = pexpr->Pop();
+
+	switch (popNode->Eopid())
+	{
+		case COperator::EopPhysicalCTEProducer:
+		{
+			// The Producer's distribution is that of its single child.
+			// Only replicated-like Producers are recorded; the others
+			// cannot cause the cross-slice problem looked for here.
+			GPOS_ASSERT(1 == pexpr->Arity());
+			CDistributionSpec *pdsChild =
+				CDrvdPropPlan::Pdpplan((*pexpr)[0]->PdpDerive())->Pds();
+			if (FReplicatedLikeDistribution(pdsChild->Edt()))
+			{
+				prodInfos->Append(GPOS_NEW(mp) SCTEInfo(
+					CPhysicalCTEProducer::PopConvert(popNode)->UlCTEId(),
+					curSlice));
+			}
+			break;
+		}
+		case COperator::EopPhysicalCTEConsumer:
+		{
+			// Just remember where the Consumer sits and leave the
+			// verdict to the caller after the full walk.
+			consInfos->Append(GPOS_NEW(mp) SCTEInfo(
+				CPhysicalCTEConsumer::PopConvert(popNode)->UlCTEId(),
+				curSlice));
+			break;
+		}
+		default:
+			break;
+	}
+
+	const BOOL fUnderMotion = CUtils::FPhysicalMotion(popNode);
+	const ULONG ulArity = pexpr->Arity();
+	for (ULONG ulChild = 0; ulChild < ulArity; ulChild++)
+	{
+		CExpression *pexprKid = (*pexpr)[ulChild];
+		if (pexprKid->Pop()->FScalar())
+		{
+			continue;
+		}
+		// non-scalar children of a Motion each get the next unused slice id
+		const ULONG ulKidSlice = fUnderMotion ? ++(*pNextSlice) : curSlice;
+		CollectCTESlices(mp, pexprKid, ulKidSlice, pNextSlice, prodInfos,
+						 consInfos);
+	}
+}
+
+static BOOL
+FFoundCrossSlice(const CTEInfoArray *consInfos, const CTEInfoArray *prodInfos)
+{
+	for (ULONG ulCons = 0; ulCons < consInfos->Size(); ulCons++)
+	{
+		const SCTEInfo *pinfoCons = (*consInfos)[ulCons];
+		for (ULONG ulProd = 0; ulProd < prodInfos->Size(); ulProd++)
+		{
+			const SCTEInfo *pinfoProd = (*prodInfos)[ulProd];
+			if (pinfoCons->cteId == pinfoProd->cteId &&
+				pinfoCons->sliceId != pinfoProd->sliceId)
+			{
+				return true;
+			}
+		}
+	}
+	return false;
+}
+
+BOOL
+CUtils::FHasCrossSliceReplicatedCTEConsumer(CMemoryPool *mp, CExpression *pexpr)
+{
+	// Nothing to inspect: an absent tree has no Producers or Consumers.
+	if (nullptr == pexpr)
+	{
+		return false;
+	}
+	// Per-walk bookkeeping; the root of pexpr is treated as slice 0.
+	CTEInfoArray *prodInfos = GPOS_NEW(mp) CTEInfoArray(mp);
+	CTEInfoArray *consInfos = GPOS_NEW(mp) CTEInfoArray(mp);
+	ULONG nextSlice = 0;
+	CollectCTESlices(mp, pexpr, 0 /*curSlice*/, &nextSlice, prodInfos,
+					 consInfos);
+	// True iff a Consumer and a recorded Producer of its CTE differ in slice.
+	BOOL cross = FFoundCrossSlice(consInfos, prodInfos);
+
+	prodInfos->Release();
+	consInfos->Release();
+
+	return cross;
+}
+
 //---------------------------------------------------------------------------
 //	@class:
 //		CUtils::FHasSubqueryOrApply
diff --git a/src/backend/gporca/libgpopt/src/base/Makefile b/src/backend/gporca/libgpopt/src/base/Makefile
index 604fd3a6fa4..01f2bb0a02a 100644
--- a/src/backend/gporca/libgpopt/src/base/Makefile
+++ b/src/backend/gporca/libgpopt/src/base/Makefile
@@ -42,6 +42,7 @@ OBJS        = CAutoOptCtxt.o \
               CDistributionSpecStrictRandom.o \
               CDistributionSpecStrictSingleton.o \
               CDistributionSpecUniversal.o \
+              CDistributionSpecWorkerRandom.o \
               CDrvdProp.o \
               CDrvdPropCtxt.o \
               CDrvdPropCtxtPlan.o \
diff --git a/src/backend/gporca/libgpopt/src/operators/CLogicalGet.cpp b/src/backend/gporca/libgpopt/src/operators/CLogicalGet.cpp
index ff93a28522c..8e6e3461d51 100644
--- a/src/backend/gporca/libgpopt/src/operators/CLogicalGet.cpp
+++ b/src/backend/gporca/libgpopt/src/operators/CLogicalGet.cpp
@@ -305,6 +305,8 @@ CLogicalGet::PxfsCandidates(CMemoryPool *mp) const
 	CXformSet *xform_set = GPOS_NEW(mp) CXformSet(mp);
 
 	(void) xform_set->ExchangeSet(CXform::ExfGet2TableScan);
+	// add parallel table scan
+	(void) xform_set->ExchangeSet(CXform::ExfGet2ParallelTableScan);
 
 	return xform_set;
 }
diff --git a/src/backend/gporca/libgpopt/src/operators/CNormalizer.cpp b/src/backend/gporca/libgpopt/src/operators/CNormalizer.cpp
index 97fb97a1409..38c8a93a9ab 100644
--- a/src/backend/gporca/libgpopt/src/operators/CNormalizer.cpp
+++ b/src/backend/gporca/libgpopt/src/operators/CNormalizer.cpp
@@ -18,6 +18,7 @@
 #include "gpopt/base/CUtils.h"
 #include "gpopt/operators/CLogical.h"
 #include "gpopt/operators/CLogicalConstTableGet.h"
+#include "gpopt/operators/CLogicalGbAgg.h"
 #include "gpopt/operators/CLogicalInnerJoin.h"
 #include "gpopt/operators/CLogicalLeftOuterCorrelatedApply.h"
 #include "gpopt/operators/CLogicalLeftOuterJoin.h"
@@ -126,6 +127,18 @@ CNormalizer::FPushable(CExpression *pexprLogical, CExpression *pexprPred)
 		return false;
 	}
 
+	// do not push predicates below a scalar (plain) aggregate, i.e. one with
+	// no grouping columns. A scalar aggregate produces exactly one output row
+	// regardless of input cardinality, so a predicate above it (HAVING clause)
+	// must be evaluated against that output row, not the aggregate's input.
+	// Pushing e.g. "HAVING false" below would leave the agg emitting one row
+	// (e.g. count = 0) instead of zero rows.
+	if (COperator::EopLogicalGbAgg == pexprLogical->Pop()->Eopid() &&
+		0 == CLogicalGbAgg::PopConvert(pexprLogical->Pop())->Pdrgpcr()->Size())
+	{
+		return false;
+	}
+
 
 	CColRefSet *pcrsUsed = pexprPred->DeriveUsedColumns();
 	CColRefSet *pcrsOutput = pexprLogical->DeriveOutputColumns();
diff --git a/src/backend/gporca/libgpopt/src/operators/CPhysicalCTEProducer.cpp b/src/backend/gporca/libgpopt/src/operators/CPhysicalCTEProducer.cpp
index c6be21f87cd..a13e89fda1e 100644
--- a/src/backend/gporca/libgpopt/src/operators/CPhysicalCTEProducer.cpp
+++ b/src/backend/gporca/libgpopt/src/operators/CPhysicalCTEProducer.cpp
@@ -14,6 +14,7 @@
 #include "gpos/base.h"
 
 #include "gpopt/base/CCTEMap.h"
+#include "gpopt/base/CDistributionSpecRandom.h"
 #include "gpopt/base/COptCtxt.h"
 #include "gpopt/operators/CExpression.h"
 #include "gpopt/operators/CExpressionHandle.h"
diff --git a/src/backend/gporca/libgpopt/src/operators/CPhysicalParallelTableScan.cpp b/src/backend/gporca/libgpopt/src/operators/CPhysicalParallelTableScan.cpp
new file mode 100644
index 00000000000..a70a35981c6
--- /dev/null
+++ b/src/backend/gporca/libgpopt/src/operators/CPhysicalParallelTableScan.cpp
@@ -0,0 +1,284 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CPhysicalParallelTableScan.cpp
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/src/operators/CPhysicalParallelTableScan.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "gpopt/operators/CPhysicalParallelTableScan.h"
+
+#include "gpos/base.h"
+
+#include "gpopt/base/CDistributionSpec.h"
+#include "gpopt/base/CDistributionSpecHashed.h"
+#include "gpopt/base/CDistributionSpecRandom.h"
+#include "gpopt/base/CDistributionSpecWorkerRandom.h"
+#include "gpopt/base/CDistributionSpecSingleton.h"
+#include "gpopt/base/CUtils.h"
+#include "gpopt/base/CEnfdDistribution.h"
+#include "gpopt/base/CEnfdRewindability.h"
+#include "gpopt/base/COptimizationContext.h"
+#include "gpopt/base/CRewindabilitySpec.h"
+#include "gpopt/base/CDrvdPropPlan.h"
+#include "gpopt/metadata/CName.h"
+#include "gpopt/metadata/CTableDescriptor.h"
+#include "gpopt/operators/CExpressionHandle.h"
+
+using namespace gpopt;
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::CPhysicalParallelTableScan
+//
+//	@doc:
+//		Ctor taking only a memory pool: fixed alias, no table, one worker
+//
+//---------------------------------------------------------------------------
+CPhysicalParallelTableScan::CPhysicalParallelTableScan(CMemoryPool *mp)
+	: CPhysicalTableScan(mp, GPOS_NEW(mp) CName(GPOS_NEW(mp) CWStringConst(GPOS_WSZ_LIT("parallel_table"))), nullptr, nullptr),
+	  m_ulParallelWorkers(1),
+	  m_pdsWorkerDistribution(nullptr)
+{
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::CPhysicalParallelTableScan
+//
+//	@doc:
+//		Ctor; wraps the scan's m_pds in a worker-level random distribution
+//
+//---------------------------------------------------------------------------
+CPhysicalParallelTableScan::CPhysicalParallelTableScan(CMemoryPool *mp,
+													   const CName *pnameAlias,
+													   CTableDescriptor *ptabdesc,
+													   CColRefArray *pdrgpcrOutput,
+													   ULONG ulParallelWorkers)
+	: CPhysicalTableScan(mp, pnameAlias, ptabdesc, pdrgpcrOutput),
+	  m_ulParallelWorkers(ulParallelWorkers),
+	  m_pdsWorkerDistribution(nullptr)
+{
+	GPOS_ASSERT(ulParallelWorkers > 0);
+	GPOS_ASSERT(nullptr != m_pds);
+	// Same conditions re-checked at runtime (presumably for non-debug builds)
+	if (ulParallelWorkers > 0 && nullptr != m_pds)
+	{
+		// NOTE(review): m_pds is passed without an AddRef() here -- confirm
+		// that PdsCreateWorkerRandom takes its own reference on the base spec
+		m_pdsWorkerDistribution = CDistributionSpecWorkerRandom::PdsCreateWorkerRandom(mp, ulParallelWorkers, m_pds);
+	}
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::~CPhysicalParallelTableScan
+//
+//	@doc:
+//		Dtor; releases m_pdsWorkerDistribution via CRefCount::SafeRelease
+//
+//---------------------------------------------------------------------------
+CPhysicalParallelTableScan::~CPhysicalParallelTableScan()
+{
+	CRefCount::SafeRelease(m_pdsWorkerDistribution);
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::HashValue
+//
+//	@doc:
+//		Combine pointer for table descriptor, parallel workers and Eop
+//
+//---------------------------------------------------------------------------
+ULONG
+CPhysicalParallelTableScan::HashValue() const
+{
+	// fold the worker count into the hash of the underlying table scan
+	const ULONG ulWorkersHash = gpos::HashValue<ULONG>(&m_ulParallelWorkers);
+	return gpos::CombineHashes(CPhysicalTableScan::HashValue(), ulWorkersHash);
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::Matches
+//
+//	@doc:
+//		match operator
+//
+//---------------------------------------------------------------------------
+BOOL
+CPhysicalParallelTableScan::Matches(COperator *pop) const
+{
+	if (pop->Eopid() != Eopid())
+	{
+		return false;
+	}
+
+	// same kind: the base scan must match and the worker counts must agree
+	const ULONG ulOtherWorkers =
+		CPhysicalParallelTableScan::PopConvert(pop)->UlParallelWorkers();
+	return CPhysicalTableScan::Matches(pop) &&
+		   ulOtherWorkers == m_ulParallelWorkers;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::OsPrint
+//
+//	@doc:
+//		Debug print: operator id, alias, table name, columns, worker count
+//
+//---------------------------------------------------------------------------
+IOstream &
+CPhysicalParallelTableScan::OsPrint(IOstream &os) const
+{
+	os << SzId() << " ";
+
+	// alias of table as referenced in the query
+	m_pnameAlias->OsPrint(os);
+
+	// actual name of table in catalog and columns
+	os << " (";
+	m_ptabdesc->Name().OsPrint(os);
+	os << "), Columns: [";
+
+	CUtils::OsPrintDrgPcr(os, m_pdrgpcrOutput);
+	os << "], Workers: " << m_ulParallelWorkers;
+
+	return os;
+}
+
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::PdsDerive
+//
+//	@doc:
+//		Derive distribution for parallel table scan
+//
+//---------------------------------------------------------------------------
+CDistributionSpec *
+CPhysicalParallelTableScan::PdsDerive(CMemoryPool *mp, CExpressionHandle &exprhdl) const
+{
+	// Without a pre-computed worker distribution, defer to the base
+	// physical scan's derivation
+	if (nullptr == m_pdsWorkerDistribution)
+	{
+		return CPhysicalScan::PdsDerive(mp, exprhdl);
+	}
+
+	// Hand out the worker distribution with an extra reference
+	m_pdsWorkerDistribution->AddRef();
+	return m_pdsWorkerDistribution;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::EpetDistribution
+//
+//	@doc:
+//		Return the enforcing type for distribution property based on this
+//		operator
+//
+//---------------------------------------------------------------------------
+CEnfdProp::EPropEnforcingType
+CPhysicalParallelTableScan::EpetDistribution(CExpressionHandle & /*exprhdl*/,
+											  const CEnfdDistribution *ped) const
+{
+	GPOS_ASSERT(nullptr != ped);
+
+	// Only the worker-level distribution is tested against the requirement;
+	// when it is present and compatible no enforcer is needed
+	if (nullptr != m_pdsWorkerDistribution && ped->FCompatible(m_pdsWorkerDistribution))
+	{
+		return CEnfdProp::EpetUnnecessary;
+	}
+
+	// Worker distribution missing or incompatible with the requirement:
+	// report that enforcement (a Motion, per the original note) is required
+	return CEnfdProp::EpetRequired;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::EpetRewindability
+//
+//	@doc:
+//		Return rewindability property enforcing type for this operator
+//
+//---------------------------------------------------------------------------
+CEnfdProp::EPropEnforcingType
+CPhysicalParallelTableScan::EpetRewindability(CExpressionHandle &exprhdl,
+											  const CEnfdRewindability *per) const
+{
+	GPOS_ASSERT(nullptr != per);
+
+	// Rewindability spec stored in the plan properties of the handle
+	CRewindabilitySpec *prs = CDrvdPropPlan::Pdpplan(exprhdl.Pdp())->Prs();
+
+	// Check if our derived rewindability satisfies the requirement
+	if (per->FCompatible(prs))
+	{
+		// Derived spec is compatible with the request: nothing to enforce
+		return CEnfdProp::EpetUnnecessary;
+	}
+
+	// Cannot satisfy the rewindability requirement
+	// An enforcer is needed (presumably a Spool -- TODO confirm)
+	return CEnfdProp::EpetRequired;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CPhysicalParallelTableScan::FValidContext
+//
+//	@doc:
+//		Check if optimization context is valid;
+//		reject contexts whose required rewindability spec reports an NL Join
+//		origin (IsOriginNLJoin), e.g. the inner child of an NL Join
+//
+//---------------------------------------------------------------------------
+BOOL
+CPhysicalParallelTableScan::FValidContext(CMemoryPool *,
+										  COptimizationContext *poc,
+										  COptimizationContextArray *) const
+{
+	GPOS_ASSERT(nullptr != poc);
+
+	CReqdPropPlan *prpp = poc->Prpp();
+	CRewindabilitySpec *prsRequired = prpp->Per()->PrsRequired();
+
+	// Only the NL Join origin flag of the requirement is inspected here,
+	// not the required rewindability type itself
+	if (prsRequired->IsOriginNLJoin())
+	{
+		// Request originates from an NL Join (e.g., its inner child)
+		// but ParallelTableScan cannot provide it
+		// Reject this plan to avoid the assertion failure later
+		return false;
+	}
+
+	return true;
+}
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/src/operators/Makefile b/src/backend/gporca/libgpopt/src/operators/Makefile
index faa0f9a70d6..ce5362e9049 100644
--- a/src/backend/gporca/libgpopt/src/operators/Makefile
+++ b/src/backend/gporca/libgpopt/src/operators/Makefile
@@ -123,6 +123,7 @@ OBJS        = CExpression.o \
               CPhysicalMotionRoutedDistribute.o \
               CPhysicalDynamicForeignScan.o \
               CPhysicalNLJoin.o \
+              CPhysicalParallelTableScan.o \
               CPhysicalParallelUnionAll.o \
               CPhysicalPartitionSelector.o \
               CPhysicalRightOuterHashJoin.o \
diff --git a/src/backend/gporca/libgpopt/src/optimizer/COptimizerConfig.cpp b/src/backend/gporca/libgpopt/src/optimizer/COptimizerConfig.cpp
index e55a04862aa..a9486f33e09 100644
--- a/src/backend/gporca/libgpopt/src/optimizer/COptimizerConfig.cpp
+++ b/src/backend/gporca/libgpopt/src/optimizer/COptimizerConfig.cpp
@@ -33,14 +33,16 @@ COptimizerConfig::COptimizerConfig(CEnumeratorConfig *pec,
 								   CStatisticsConfig *stats_config,
 								   CCTEConfig *pcteconf, ICostModel *cost_model,
 								   CHint *phint, CPlanHint *pplanhint,
-								   CWindowOids *pwindowoids)
+								   CWindowOids *pwindowoids,
+								   BOOL enable_parallel_plans)
 	: m_enumerator_cfg(pec),
 	  m_stats_conf(stats_config),
 	  m_cte_conf(pcteconf),
 	  m_cost_model(cost_model),
 	  m_hint(phint),
 	  m_plan_hint(pplanhint),
-	  m_window_oids(pwindowoids)
+	  m_window_oids(pwindowoids),
+	  m_create_parallel_plan(enable_parallel_plans)
 {
 	GPOS_ASSERT(nullptr != pec);
 	GPOS_ASSERT(nullptr != stats_config);
@@ -85,7 +87,7 @@ COptimizerConfig::PoconfDefault(CMemoryPool *mp)
 		CStatisticsConfig::PstatsconfDefault(mp),
 		CCTEConfig::PcteconfDefault(mp), ICostModel::PcmDefault(mp),
 		CHint::PhintDefault(mp), nullptr /* pplanhint */,
-		CWindowOids::GetWindowOids(mp));
+		CWindowOids::GetWindowOids(mp), false /* enable_parallel_plans */);
 }
 
 //---------------------------------------------------------------------------
@@ -105,7 +107,7 @@ COptimizerConfig::PoconfDefault(CMemoryPool *mp, ICostModel *pcm)
 		GPOS_NEW(mp) CEnumeratorConfig(mp, 0 /*plan_id*/, 0 /*ullSamples*/),
 		CStatisticsConfig::PstatsconfDefault(mp),
 		CCTEConfig::PcteconfDefault(mp), pcm, CHint::PhintDefault(mp),
-		nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp));
+		nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp), false /* enable_parallel_plans */);
 }
 
 //---------------------------------------------------------------------------
diff --git a/src/backend/gporca/libgpopt/src/search/CGroup.cpp b/src/backend/gporca/libgpopt/src/search/CGroup.cpp
index 18b4cf44e5b..02fd7fa9ccc 100644
--- a/src/backend/gporca/libgpopt/src/search/CGroup.cpp
+++ b/src/backend/gporca/libgpopt/src/search/CGroup.cpp
@@ -152,6 +152,7 @@ CGroup::SContextLink::Equals(const SContextLink *pclink1,
 //---------------------------------------------------------------------------
 CGroup::CGroup(CMemoryPool *mp, BOOL fScalar)
 	: m_mp(mp),
+	  m_pmemo(nullptr),
 	  m_id(GPOPT_INVALID_GROUP_ID),
 	  m_fScalar(fScalar),
 	  m_pdrgpexprJoinKeysOuter(nullptr),
@@ -534,6 +535,25 @@ CGroup::SetState(EState estNewState)
 }
 
 
+//---------------------------------------------------------------------------
+//	@function:
+//		CGroup::SetMemo
+//
+//	@doc:
+//		Set containing memo reference; asserts it was not assigned before
+//
+//---------------------------------------------------------------------------
+void
+CGroup::SetMemo(CMemo *pmemo)
+{
+	GPOS_ASSERT(nullptr != pmemo);
+	GPOS_ASSERT(nullptr == m_pmemo &&
+				"Overwriting previously assigned memo reference");
+
+	m_pmemo = pmemo;
+}
+
+
 void
 CGroup::SetJoinKeys(CExpressionArray *pdrgpexprOuter,
 					CExpressionArray *pdrgpexprInner,
diff --git a/src/backend/gporca/libgpopt/src/search/CMemo.cpp b/src/backend/gporca/libgpopt/src/search/CMemo.cpp
index 5248300aa86..d92da7a9ed9 100644
--- a/src/backend/gporca/libgpopt/src/search/CMemo.cpp
+++ b/src/backend/gporca/libgpopt/src/search/CMemo.cpp
@@ -140,6 +140,7 @@ CMemo::Add(
 		GPOS_ASSERT(nullptr != gp.PgexprFirst());
 
 		gp.SetId(id);
+		gp.SetMemo(this);
 		gp.InitProperties(pdp);
 	}
 
diff --git a/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXL.cpp b/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXL.cpp
index 6119e2ba71f..51acac518be 100644
--- a/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXL.cpp
+++ b/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXL.cpp
@@ -66,6 +66,7 @@
 #include "gpopt/operators/CPhysicalStreamAggDeduplicate.h"
 #include "gpopt/operators/CPhysicalTVF.h"
 #include "gpopt/operators/CPhysicalTableScan.h"
+#include "gpopt/operators/CPhysicalParallelTableScan.h"
 #include "gpopt/operators/CPhysicalUnionAll.h"
 #include "gpopt/operators/CPredicateUtils.h"
 #include "gpopt/operators/CScalarArray.h"
@@ -129,6 +130,7 @@
 #include "naucrates/dxl/operators/CDXLPhysicalSplit.h"
 #include "naucrates/dxl/operators/CDXLPhysicalTVF.h"
 #include "naucrates/dxl/operators/CDXLPhysicalTableScan.h"
+#include "naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h"
 #include "naucrates/dxl/operators/CDXLPhysicalWindow.h"
 #include "naucrates/dxl/operators/CDXLScalarAggref.h"
 #include "naucrates/dxl/operators/CDXLScalarArray.h"
@@ -265,6 +267,20 @@ CTranslatorExprToDXL::PdxlnTranslate(CExpression *pexpr,
 
 	GPOS_ASSERT(nullptr == m_pdpplan);
 
+	// Walk the physical tree and detect a CTE Consumer placed on a
+	// different slice than its Producer when the Producer's output is
+	// replicated-like (StrictReplicated/TaintedReplicated/Universal).
+	// Fall back to the Postgres optimizer if it is detected because
+	// it breaks Producer-Consumer locality and can hang the
+	// query at execution.
+	if (CUtils::FHasCrossSliceReplicatedCTEConsumer(m_mp, pexpr))
+	{
+		GPOS_RAISE(
+			gpopt::ExmaDXL, gpopt::ExmiExpr2DXLUnsupportedFeature,
+			GPOS_WSZ_LIT(
+				"CTE Consumer placed on a different slice than its replicated Producer"));
+	}
+
 	m_pdpplan = CDrvdPropPlan::Pdpplan(pexpr->PdpDerive());
 	m_pdpplan->AddRef();
 
@@ -342,6 +358,7 @@ CTranslatorExprToDXL::CreateDXLNode(CExpression *pexpr,
 	GPOS_ASSERT(nullptr != pexpr);
 	ULONG ulOpId = (ULONG) pexpr->Pop()->Eopid();
 	if (COperator::EopPhysicalTableScan == ulOpId ||
+		COperator::EopPhysicalParallelTableScan == ulOpId ||
 		COperator::EopPhysicalForeignScan == ulOpId)
 	{
 		CDXLNode *dxlnode = PdxlnTblScan(
@@ -711,6 +728,13 @@ CTranslatorExprToDXL::PdxlnTblScan(CExpression *pexprTblScan,
 	{
 		pdxlopTS = GPOS_NEW(m_mp) CDXLPhysicalTableScan(m_mp, table_descr);
 	}
+	else if (COperator::EopPhysicalParallelTableScan == op_id)
+	{
+		CPhysicalParallelTableScan *parallel_scan =
+			CPhysicalParallelTableScan::PopConvert(pexprTblScan->Pop());
+		pdxlopTS = GPOS_NEW(m_mp) CDXLPhysicalParallelTableScan(
+			m_mp, table_descr, parallel_scan->UlParallelWorkers());
+	}
 	else
 	{
 		GPOS_ASSERT(COperator::EopPhysicalForeignScan == op_id);
@@ -2556,6 +2580,7 @@ CTranslatorExprToDXL::PdxlnFromFilter(CExpression *pexprFilter,
 	switch (eopidRelational)
 	{
 		case COperator::EopPhysicalTableScan:
+		case COperator::EopPhysicalParallelTableScan:
 		case COperator::EopPhysicalForeignScan:
 		{
 			// if there is a structure of the form
@@ -4250,6 +4275,18 @@ CTranslatorExprToDXL::BuildScalarSubplans(
 {
 	const ULONG size = pdrgpcrInner->Size();
 
+	// Fallback to Postgres optimizer if the SubPlan's inner expression contains a
+	// CTE Consumer placed on a different slice than its replicated Producer.
+	// Such a Consumer becomes a cross-slice Shared Scan reader without a local
+	// Producer, which can hang the query or fail at execution time.
+	if (CUtils::FHasCrossSliceReplicatedCTEConsumer(m_mp, pexprInner))
+	{
+		GPOS_RAISE(
+			gpopt::ExmaDXL, gpopt::ExmiExpr2DXLUnsupportedFeature,
+			GPOS_WSZ_LIT(
+				"CTE Consumer placed on a different slice than its replicated Producer"));
+	}
+
 	CDXLNodeArray *pdrgpdxlnInner = GPOS_NEW(m_mp) CDXLNodeArray(m_mp);
 	for (ULONG ul = 0; ul < size; ul++)
 	{
@@ -4383,6 +4420,7 @@ CTranslatorExprToDXL::PdxlnCorrelatedNLJoin(
 	switch (pexprOuterChild->Pop()->Eopid())
 	{
 		case COperator::EopPhysicalTableScan:
+		case COperator::EopPhysicalParallelTableScan:
 		{
 			dxl_properties->AddRef();
 			// create and return a table scan node
@@ -4571,6 +4609,7 @@ UlIndexFilter(Edxlopid edxlopid)
 	{
 		case EdxlopPhysicalTableScan:
 		case EdxlopPhysicalForeignScan:
+		case EdxlopPhysicalParallelTableScan:
 			return EdxltsIndexFilter;
 		case EdxlopPhysicalDynamicForeignScan:
 			return EdxldfsIndexFilter;
@@ -4626,6 +4665,7 @@ CTranslatorExprToDXL::PdxlnResultFromNLJoinOuter(
 		case EdxlopPhysicalDynamicIndexScan:
 		case EdxlopPhysicalDynamicBitmapTableScan:
 		case EdxlopPhysicalResult:
+		case EdxlopPhysicalParallelTableScan:
 		{
 			// if the scalar join condition is a constant TRUE, just translate the child, no need to create an AND expression
 			if (CTranslatorExprToDXLUtils::FScalarConstTrue(m_pmda,
diff --git a/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXLUtils.cpp b/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXLUtils.cpp
index 27f5cb688fe..7fa48972366 100644
--- a/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXLUtils.cpp
+++ b/src/backend/gporca/libgpopt/src/translate/CTranslatorExprToDXLUtils.cpp
@@ -17,6 +17,7 @@
 #include "gpopt/base/CConstraintDisjunction.h"
 #include "gpopt/base/CConstraintInterval.h"
 #include "gpopt/base/CConstraintNegation.h"
+#include "gpopt/base/CDistributionSpecWorkerRandom.h"
 #include "gpopt/base/COptCtxt.h"
 #include "gpopt/exception.h"
 #include "gpopt/mdcache/CMDAccessorUtils.h"
@@ -759,10 +760,11 @@ CTranslatorExprToDXLUtils::SetDirectDispatchInfo(
 	//			  +--CScalarConst (5)
 
 	if (CDistributionSpec::EdtHashed == pds->Edt() ||
-		CDistributionSpec::EdtRandom == pds->Edt())
+		CDistributionSpec::EdtRandom == pds->Edt() ||
+		CDistributionSpec::EdtWorkerRandom == pds->Edt())
 	{
 		// direct dispatch supported for scans over
-		// hash & random distributed tables
+		// hash, random & worker-random distributed tables
 		for (ULONG i = 0; i < size; i++)
 		{
 			CExpression *pexprFilter = (*pexprFilterArray)[i];
@@ -816,6 +818,62 @@ CTranslatorExprToDXLUtils::SetDirectDispatchInfo(
 					dxl_direct_dispatch_info = GetDXLDirectDispatchInfoRandDist(
 						mp, md_accessor, pcrDistrCol, pcnstrDistrCol);
 				}
+				else if (CDistributionSpec::EdtWorkerRandom == pds->Edt())
+				{
+					CConstraint *pcnstr = ppc->Pcnstr();
+
+					CDistributionSpecWorkerRandom *pdsWorkerRandom =
+						CDistributionSpecWorkerRandom::PdsConvert(pds);
+
+					// Get the base segment distribution for worker-random distribution
+					CDistributionSpec *pdsSegmentBase = pdsWorkerRandom->PdsSegmentBase();
+
+					if (nullptr == pdsSegmentBase)
+					{
+						// No base segment distribution available, cannot proceed with direct dispatch
+						continue;
+					}
+
+					// Handle direct dispatch based on the base segment distribution type
+					if (CDistributionSpec::EdtHashed == pdsSegmentBase->Edt())
+					{
+						// Base distribution is hashed - use hash distribution keys
+						CDistributionSpecHashed *pdsHashed =
+							CDistributionSpecHashed::PdsConvert(pdsSegmentBase);
+						CExpressionArray *pdrgpexprHashed = pdsHashed->Pdrgpexpr();
+
+						dxl_direct_dispatch_info = GetDXLDirectDispatchInfo(
+							mp, md_accessor, pdrgpexprHashed, pcnstr);
+					}
+					else if (CDistributionSpec::EdtRandom == pdsSegmentBase->Edt())
+					{
+						// Base distribution is random - use gp_segment_id
+						CDistributionSpecRandom *pdsRandom =
+							CDistributionSpecRandom::PdsConvert(pdsSegmentBase);
+
+						// Extracting GpSegmentID for base random distribution
+						const CColRef *pcrDistrCol = pdsRandom->GetGpSegmentId();
+
+						if (pcrDistrCol == nullptr)
+						{
+							// Direct Dispatch not feasible - no gp_segment_id available
+							continue;
+						}
+
+						CConstraint *pcnstrDistrCol = pcnstr->Pcnstr(mp, pcrDistrCol);
+
+						if (pcnstrDistrCol == nullptr)
+						{
+							// Direct Dispatch not feasible - no constraint on gp_segment_id
+							continue;
+						}
+
+						dxl_direct_dispatch_info = GetDXLDirectDispatchInfoRandDist(
+							mp, md_accessor, pcrDistrCol, pcnstrDistrCol);
+					}
+					// Note: Other base distribution types (Singleton, Replicated, etc.)
+					// are not supported for direct dispatch in worker-random context
+				}
 
 				if (nullptr != dxl_direct_dispatch_info)
 				{
@@ -1296,7 +1354,8 @@ CTranslatorExprToDXLUtils::FLocalHashAggStreamSafe(CExpression *pexprAgg)
 
 	// is a local hash aggregate and it generates duplicates (therefore safe to stream)
 	return (COperator::EgbaggtypeLocal == popAgg->Egbaggtype()) &&
-		   popAgg->FGeneratesDuplicates();
+		   popAgg->FGeneratesDuplicates() &&
+		   !GPOS_FTRACE(EopttraceDisableStreamingHashAgg);
 }
 
 //---------------------------------------------------------------------------
diff --git a/src/backend/gporca/libgpopt/src/xforms/CSubqueryHandler.cpp b/src/backend/gporca/libgpopt/src/xforms/CSubqueryHandler.cpp
index 791ee8345a9..a3c333c5ab1 100644
--- a/src/backend/gporca/libgpopt/src/xforms/CSubqueryHandler.cpp
+++ b/src/backend/gporca/libgpopt/src/xforms/CSubqueryHandler.cpp
@@ -308,6 +308,93 @@ CSubqueryHandler::FProjectCountSubquery(CExpression *pexprSubquery,
 }
 
 
+//---------------------------------------------------------------------------
+//	@function:
+//		FContainsEmptyGbAgg
+//
+//	@doc:
+//		Return true if the first GbAgg reached along some logical path from
+//		pexpr has no grouping columns (GROUP BY ()); the search stops there
+//
+//---------------------------------------------------------------------------
+static BOOL
+FContainsEmptyGbAgg(CExpression *pexpr)
+{
+	if (COperator::EopLogicalGbAgg == pexpr->Pop()->Eopid())
+	{
+		return 0 == CLogicalGbAgg::PopConvert(pexpr->Pop())->Pdrgpcr()->Size();
+	}
+	const ULONG arity = pexpr->Arity();
+	for (ULONG ul = 0; ul < arity; ul++)
+	{
+		CExpression *pexprChild = (*pexpr)[ul];
+		if (pexprChild->Pop()->FLogical() && FContainsEmptyGbAgg(pexprChild))
+		{
+			return true;
+		}
+	}
+	return false;
+}
+
+
+//---------------------------------------------------------------------------
+//	@function:
+//		FHasCorrelatedSelectAboveGbAgg
+//
+//	@doc:
+//		Return true if pexpr has a CLogicalSelect with outer references in its
+//		filter predicate that sits above a GROUP BY () aggregate.  This pattern
+//		arises when a correlated scalar subquery has a correlated HAVING clause,
+//		e.g. "SELECT count(*) FROM t GROUP BY () HAVING outer_col".
+//
+//		When such a pattern exists the scalar subquery must NOT be decorrelated
+//		with COALESCE(count,0) semantics: if the HAVING condition is false the
+//		subquery should return NULL (no rows), not 0.
+//
+//---------------------------------------------------------------------------
+static BOOL
+FHasCorrelatedSelectAboveGbAgg(CExpression *pexpr)
+{
+	COperator *pop = pexpr->Pop();
+
+	// A GbAgg ends the search on this branch: only Selects located
+	// *above* a GbAgg are of interest, so there is nothing left to
+	// inspect once the aggregate itself has been reached.
+	if (COperator::EopLogicalGbAgg == pop->Eopid())
+	{
+		return false;
+	}
+
+	if (COperator::EopLogicalSelect == pop->Eopid() && pexpr->HasOuterRefs())
+	{
+		// Outer references exist somewhere under this Select. When its
+		// relational input (child 0) is free of them, they can only sit
+		// in the filter (child 1); combined with a GROUP BY () aggregate
+		// below, that is the correlated-HAVING shape being searched for.
+		CExpression *pexprInput = (*pexpr)[0];
+		if (!pexprInput->HasOuterRefs() && FContainsEmptyGbAgg(pexprInput))
+		{
+			return true;
+		}
+	}
+
+	// Descend through logical children only; the others are skipped.
+	for (ULONG ulChild = 0; ulChild < pexpr->Arity(); ulChild++)
+	{
+		CExpression *pexprKid = (*pexpr)[ulChild];
+		if (!pexprKid->Pop()->FLogical())
+		{
+			continue;
+		}
+		if (FHasCorrelatedSelectAboveGbAgg(pexprKid))
+		{
+			return true;
+		}
+	}
+	return false;
+}
+
+
 //---------------------------------------------------------------------------
 //	@function:
 //		CSubqueryHandler::SSubqueryDesc::SetCorrelatedExecution
@@ -382,6 +469,21 @@ CSubqueryHandler::Psd(CMemoryPool *mp, CExpression *pexprSubquery,
 	// set flag of correlated execution
 	psd->SetCorrelatedExecution();
 
+	// A correlated scalar subquery of the form
+	//   SELECT count(*) FROM t GROUP BY () HAVING <outer_ref_condition>
+	// must execute as a correlated SubPlan.  After NormalizeHaving() the HAVING
+	// clause becomes a CLogicalSelect with outer refs sitting above the GbAgg.
+	// If we decorrelate such a subquery the join filter replaces the HAVING
+	// condition, but a LEFT JOIN returns 0 (not NULL) for count(*) when no
+	// rows match — which is semantically wrong.  Forcing correlated execution
+	// preserves the correct NULL-when-no-rows semantics.
+	if (!psd->m_fCorrelatedExecution && psd->m_fHasCountAgg &&
+		psd->m_fHasOuterRefs &&
+		FHasCorrelatedSelectAboveGbAgg(pexprInner))
+	{
+		psd->m_fCorrelatedExecution = true;
+	}
+
 	return psd;
 }
 
@@ -753,8 +855,19 @@ CSubqueryHandler::FCreateOuterApplyForScalarSubquery(
 	*ppexprNewOuter = pexprPrj;
 
 	BOOL fGeneratedByQuantified = popSubquery->FGeneratedByQuantified();
+
+	// When GROUP BY () has a correlated HAVING clause (now represented as a
+	// CLogicalSelect with outer refs sitting above the GbAgg), the subquery
+	// must return NULL — not 0 — when the HAVING condition is false.
+	// Applying COALESCE(count,0) would incorrectly convert that NULL to 0,
+	// so we skip the special count(*) semantics in that case.
+	BOOL fCorrelatedHavingAboveEmptyGby =
+		(fHasCountAggMatchingColumn && 0 == pgbAgg->Pdrgpcr()->Size() &&
+		 FHasCorrelatedSelectAboveGbAgg((*pexprSubquery)[0]));
+
 	if (fGeneratedByQuantified ||
-		(fHasCountAggMatchingColumn && 0 == pgbAgg->Pdrgpcr()->Size()))
+		(fHasCountAggMatchingColumn && 0 == pgbAgg->Pdrgpcr()->Size() &&
+		 !fCorrelatedHavingAboveEmptyGby))
 	{
 		CMDAccessor *md_accessor = COptCtxt::PoctxtFromTLS()->Pmda();
 		const IMDTypeInt8 *pmdtypeint8 = md_accessor->PtMDType<IMDTypeInt8>();
diff --git a/src/backend/gporca/libgpopt/src/xforms/CXformFactory.cpp b/src/backend/gporca/libgpopt/src/xforms/CXformFactory.cpp
index e21c24511dd..7ffe39774dc 100644
--- a/src/backend/gporca/libgpopt/src/xforms/CXformFactory.cpp
+++ b/src/backend/gporca/libgpopt/src/xforms/CXformFactory.cpp
@@ -144,6 +144,7 @@ CXformFactory::Instantiate()
 	Add(GPOS_NEW(m_mp) CXformExpandNAryJoinMinCard(m_mp));
 	Add(GPOS_NEW(m_mp) CXformExpandNAryJoinDP(m_mp));
 	Add(GPOS_NEW(m_mp) CXformGet2TableScan(m_mp));
+	Add(GPOS_NEW(m_mp) CXformGet2ParallelTableScan(m_mp));
 	Add(GPOS_NEW(m_mp) CXformIndexGet2IndexScan(m_mp));
 	Add(GPOS_NEW(m_mp) CXformDynamicGet2DynamicTableScan(m_mp));
 	Add(GPOS_NEW(m_mp) CXformDynamicIndexGet2DynamicIndexScan(m_mp));
diff --git a/src/backend/gporca/libgpopt/src/xforms/CXformGet2ParallelTableScan.cpp b/src/backend/gporca/libgpopt/src/xforms/CXformGet2ParallelTableScan.cpp
new file mode 100644
index 00000000000..8799661ce49
--- /dev/null
+++ b/src/backend/gporca/libgpopt/src/xforms/CXformGet2ParallelTableScan.cpp
@@ -0,0 +1,243 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CXformGet2ParallelTableScan.cpp
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libgpopt/src/xforms/CXformGet2ParallelTableScan.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "gpopt/xforms/CXformGet2ParallelTableScan.h"
+
+#include "gpos/base.h"
+
+#include "gpopt/base/COptCtxt.h"
+#include "gpopt/hints/CHintUtils.h"
+#include "gpopt/metadata/CTableDescriptor.h"
+#include "gpopt/operators/CExpressionHandle.h"
+#include "gpopt/operators/CLogicalGet.h"
+#include "gpopt/operators/CPhysicalParallelTableScan.h"
+#include "gpopt/optimizer/COptimizerConfig.h"
+#include "naucrates/md/IMDRelation.h"
+#include "gpopt/search/CGroupProxy.h"
+#include "gpopt/search/CMemo.h"
+
+
+// Backend GUC read directly by Transform() (not wrapped by gpdbwrappers)
+extern int max_parallel_workers_per_gather;
+
+// Forward declarations for gpdbwrappers functions
+namespace gpdb {
+	bool IsParallelModeOK(void);
+}
+
+using namespace gpopt;
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CXformGet2ParallelTableScan::FHasParallelIncompatibleOps
+//
+//	@doc:
+//		Return true if any group expression in the memo is a CTE
+//		producer/consumer, a sequence operator or a set operation
+//
+//---------------------------------------------------------------------------
+BOOL
+CXformGet2ParallelTableScan::FHasParallelIncompatibleOps(CExpressionHandle &exprhdl)
+{
+	// Resolve handle -> group expression -> group -> memo.  A missing link
+	// means there is nothing to inspect, so no incompatibility is reported.
+	CGroupExpression *pgexprOrigin = exprhdl.Pgexpr();
+	if (nullptr == pgexprOrigin)
+	{
+		return false;
+	}
+
+	CGroup *pgroupOrigin = pgexprOrigin->Pgroup();
+	if (nullptr == pgroupOrigin)
+	{
+		return false;
+	}
+
+	CMemo *pmemo = pgroupOrigin->Pmemo();
+	if (nullptr == pmemo)
+	{
+		return false;
+	}
+
+	// Visit every group expression of every memo group; the first operator
+	// found on the list below ends the search with a positive answer.
+	const ULONG_PTR ulpGroupCount = pmemo->UlpGroups();
+	for (ULONG_PTR ulp = 0; ulp < ulpGroupCount; ulp++)
+	{
+		CGroup *pgroupCur = pmemo->Pgroup(ulp);
+		if (nullptr == pgroupCur)
+		{
+			continue;
+		}
+
+		// group expressions are walked through a CGroupProxy
+		CGroupProxy gp(pgroupCur);
+		for (CGroupExpression *pgexprCur = gp.PgexprFirst();
+			 nullptr != pgexprCur; pgexprCur = gp.PgexprNext(pgexprCur))
+		{
+			switch (pgexprCur->Pop()->Eopid())
+			{
+				// CTE producers/consumers and sequence operators
+				case COperator::EopLogicalCTEProducer:
+				case COperator::EopLogicalCTEConsumer:
+				case COperator::EopLogicalSequence:
+				case COperator::EopLogicalSequenceProject:
+				// set operations are not supported in parallel plans
+				case COperator::EopLogicalUnion:
+				case COperator::EopLogicalUnionAll:
+				case COperator::EopLogicalIntersect:
+				case COperator::EopLogicalIntersectAll:
+				case COperator::EopLogicalDifference:
+				case COperator::EopLogicalDifferenceAll:
+					return true;
+
+				default:
+					break;
+			}
+		}
+	}
+
+	// no listed operator anywhere in the memo
+	return false;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CXformGet2ParallelTableScan::CXformGet2ParallelTableScan
+//
+//	@doc:
+//		Ctor
+//
+//---------------------------------------------------------------------------
+CXformGet2ParallelTableScan::CXformGet2ParallelTableScan(CMemoryPool *mp)
+	: CXformImplementation(
+		  // pattern: a childless expression whose operator is CLogicalGet
+		  GPOS_NEW(mp) CExpression(mp, GPOS_NEW(mp) CLogicalGet(mp)))
+{
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CXformGet2ParallelTableScan::Exfp
+//
+//	@doc:
+//		Compute promise of xform: none when parallel mode is unavailable,
+//		an incompatible operator exists or the table is excluded; else high
+//
+//---------------------------------------------------------------------------
+CXform::EXformPromise
+CXformGet2ParallelTableScan::Exfp(CExpressionHandle &exprhdl) const
+{
+	// No promise unless gpdb::IsParallelModeOK() holds and the memo is free
+	// of the operators rejected by FHasParallelIncompatibleOps().
+	if (!gpdb::IsParallelModeOK() || FHasParallelIncompatibleOps(exprhdl))
+	{
+		return CXform::ExfpNone;
+	}
+
+	CTableDescriptor *ptabdesc =
+		CLogicalGet::PopConvert(exprhdl.Pop())->Ptabdesc();
+	const IMDRelation::Ereldistrpolicy ereldist = ptabdesc->GetRelDistribution();
+
+	// Replicated and master-only tables are skipped, and so is every table
+	// once the optimizer context reports replicated tables.
+	//FIXME: Should we consider replicated tables.
+	const BOOL fExcluded =
+		IMDRelation::EreldistrReplicated == ereldist ||
+		IMDRelation::EreldistrMasterOnly == ereldist ||
+		COptCtxt::PoctxtFromTLS()->HasReplicatedTables();
+	if (fExcluded)
+	{
+		return CXform::ExfpNone;
+	}
+
+	// Everything else gets high promise.  The worker count is not decided
+	// here; Transform() picks it (table setting first, then the GUC) when
+	// it builds the physical scan.
+	return CXform::ExfpHigh;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CXformGet2ParallelTableScan::Transform
+//
+//	@doc:
+//		Actual transformation
+//
+//---------------------------------------------------------------------------
+void
+CXformGet2ParallelTableScan::Transform(CXformContext *pxfctxt, CXformResult *pxfres,
+									   CExpression *pexpr) const
+{
+	GPOS_ASSERT(nullptr != pxfctxt);
+	GPOS_ASSERT(FPromising(pxfctxt->Pmp(), this, pexpr));
+	GPOS_ASSERT(FCheckPattern(pexpr));
+
+	CMemoryPool *mp = pxfctxt->Pmp();
+	CLogicalGet *popGet = CLogicalGet::PopConvert(pexpr->Pop());
+
+	// Inputs for the physical operator: a fresh copy of the name, plus an
+	// extra reference on the table descriptor and the output column array.
+	CName *pname = GPOS_NEW(mp) CName(mp, popGet->Name());
+
+	CTableDescriptor *ptabdesc = popGet->Ptabdesc();
+	ptabdesc->AddRef();
+
+	CColRefArray *pdrgpcrOutput = popGet->PdrgpcrOutput();
+	GPOS_ASSERT(nullptr != pdrgpcrOutput);
+	pdrgpcrOutput->AddRef();
+
+	// Pick the worker count.  Precedence:
+	//   1. the table's own parallel_workers value, when positive;
+	//   2. the max_parallel_workers_per_gather GUC, when positive;
+	//   3. a built-in default of 2.
+	const IMDRelation *pmdrel =
+		COptCtxt::PoctxtFromTLS()->Pmda()->RetrieveRel(ptabdesc->MDId());
+	const INT iTableWorkers = pmdrel->ParallelWorkers();
+
+	ULONG ulParallelWorkers;
+	if (iTableWorkers > 0)
+	{
+		ulParallelWorkers = (ULONG) iTableWorkers;
+	}
+	else if (max_parallel_workers_per_gather > 0)
+	{
+		ulParallelWorkers = (ULONG) max_parallel_workers_per_gather;
+	}
+	else
+	{
+		ulParallelWorkers = 2;
+	}
+
+	// Build the childless physical alternative and add it to the result.
+	pxfres->Add(GPOS_NEW(mp) CExpression(
+		mp, GPOS_NEW(mp) CPhysicalParallelTableScan(mp, pname, ptabdesc,
+													pdrgpcrOutput,
+													ulParallelWorkers)));
+}
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libgpopt/src/xforms/CXformGet2TableScan.cpp b/src/backend/gporca/libgpopt/src/xforms/CXformGet2TableScan.cpp
index 05e826aec92..d34068a3dfc 100644
--- a/src/backend/gporca/libgpopt/src/xforms/CXformGet2TableScan.cpp
+++ b/src/backend/gporca/libgpopt/src/xforms/CXformGet2TableScan.cpp
@@ -20,6 +20,10 @@
 #include "gpopt/operators/CPhysicalTableScan.h"
 #include "gpopt/optimizer/COptimizerConfig.h"
 
+namespace gpdb {
+	bool IsParallelModeOK(void);
+}
+
 using namespace gpopt;
 
 
@@ -57,6 +61,13 @@ CXformGet2TableScan::Exfp(CExpressionHandle &exprhdl) const
 		return CXform::ExfpNone;
 	}
 
+	// If parallel processing is enabled, give lower priority to regular table scan
+	// to allow parallel table scan to take precedence
+	if (gpdb::IsParallelModeOK())
+	{
+		return CXform::ExfpLow;
+	}
+
 	return CXform::ExfpHigh;
 }
 
diff --git a/src/backend/gporca/libgpopt/src/xforms/Makefile b/src/backend/gporca/libgpopt/src/xforms/Makefile
index 03f6293b36d..66da51e28bb 100644
--- a/src/backend/gporca/libgpopt/src/xforms/Makefile
+++ b/src/backend/gporca/libgpopt/src/xforms/Makefile
@@ -47,6 +47,7 @@ OBJS        = CDecorrelator.o \
               CXformGbAggDedup2StreamAggDedup.o \
               CXformGbAggWithMDQA2Join.o \
               CXformGet2TableScan.o \
+              CXformGet2ParallelTableScan.o \
               CXformImplementAssert.o \
               CXformImplementBitmapTableGet.o \
               CXformImplementCTEConsumer.o \
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperator.h b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperator.h
index 8fb27307c36..e583e9974a3 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperator.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperator.h
@@ -125,6 +125,7 @@ enum Edxlopid
 	EdxlopPhysicalValuesScan,
 	EdxlopPhysicalProjection,
 	EdxlopPhysicalTableScan,
+	EdxlopPhysicalParallelTableScan,
 	EdxlopPhysicalBitmapTableScan,
 	EdxlopPhysicalDynamicBitmapTableScan,
 	EdxlopPhysicalForeignScan,
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperatorFactory.h b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperatorFactory.h
index ed27db129fe..568240a5c98 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperatorFactory.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLOperatorFactory.h
@@ -134,6 +134,10 @@ class CDXLOperatorFactory
 	static CDXLPhysical *MakeDXLTblScan(CDXLMemoryManager *dxl_memory_manager,
 										const Attributes &attrs);
 
+	// create a parallel table scan operator
+	static CDXLPhysical *MakeDXLParallelTblScan(CDXLMemoryManager *dxl_memory_manager,
+												const Attributes &attrs);
+
 	// create a result operator
 	static CDXLPhysical *MakeDXLResult(CDXLMemoryManager *dxl_memory_manager);
 
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h
new file mode 100644
index 00000000000..ff3afa68df0
--- /dev/null
+++ b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h
@@ -0,0 +1,104 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CDXLPhysicalParallelTableScan.h
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#ifndef GPDXL_CDXLPhysicalParallelTableScan_H
+#define GPDXL_CDXLPhysicalParallelTableScan_H
+
+#include "gpos/base.h"
+
+#include "naucrates/dxl/operators/CDXLPhysicalTableScan.h"
+
+namespace gpdxl
+{
+using namespace gpos;
+
+//---------------------------------------------------------------------------
+//	@class:
+//		CDXLPhysicalParallelTableScan
+//
+//	@doc:
+//		Class for representing DXL parallel table scan operators
+//
+//---------------------------------------------------------------------------
+class CDXLPhysicalParallelTableScan : public CDXLPhysicalTableScan
+{
+private:
+	// number of parallel workers recorded for this scan
+	ULONG m_ulParallelWorkers;
+
+public:
+	CDXLPhysicalParallelTableScan(const CDXLPhysicalParallelTableScan &) = delete;
+
+	// ctor taking the table descriptor and the worker count
+	CDXLPhysicalParallelTableScan(CMemoryPool *mp, CDXLTableDescr *table_descr,
+								  ULONG ulParallelWorkers);
+
+	// ctor taking only the worker count (table descriptor left uninitialized)
+	CDXLPhysicalParallelTableScan(CMemoryPool *mp, ULONG ulParallelWorkers);
+
+	// dtor
+	~CDXLPhysicalParallelTableScan() override = default;
+
+	// get operator type (overrides the base table scan's id)
+	Edxlopid GetDXLOperator() const override;
+
+	// get operator name (overrides the base table scan's name)
+	const CWStringConst *GetOpNameStr() const override;
+
+	// get number of parallel workers given at construction
+	ULONG UlParallelWorkers() const
+	{
+		return m_ulParallelWorkers;
+	}
+
+	// serialize operator in DXL format, including the worker count
+	void SerializeToDXL(CXMLSerializer *xml_serializer,
+						const CDXLNode *dxlnode) const override;
+
+	// conversion function; asserts the operator id before downcasting
+	static CDXLPhysicalParallelTableScan *
+	Cast(CDXLOperator *dxl_op)
+	{
+		GPOS_ASSERT(nullptr != dxl_op);
+		GPOS_ASSERT(EdxlopPhysicalParallelTableScan == dxl_op->GetDXLOperator());
+
+		return dynamic_cast<CDXLPhysicalParallelTableScan *>(dxl_op);
+	}
+
+#ifdef GPOS_DEBUG
+	// checks whether the operator has valid structure, i.e. number and
+	// types of child nodes (declared only in GPOS_DEBUG builds)
+	void AssertValid(const CDXLNode *dxlnode, BOOL validate_children) const override;
+#endif	// GPOS_DEBUG
+
+};	// class CDXLPhysicalParallelTableScan
+
+}  // namespace gpdxl
+
+#endif	// !GPDXL_CDXLPhysicalParallelTableScan_H
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalTableScan.h b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalTableScan.h
index a043e137614..aef1695612a 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalTableScan.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/dxl/operators/CDXLPhysicalTableScan.h
@@ -76,7 +76,8 @@ class CDXLPhysicalTableScan : public CDXLPhysical
 	{
 		GPOS_ASSERT(nullptr != dxl_op);
 		GPOS_ASSERT(EdxlopPhysicalTableScan == dxl_op->GetDXLOperator() ||
-					EdxlopPhysicalForeignScan == dxl_op->GetDXLOperator());
+					EdxlopPhysicalForeignScan == dxl_op->GetDXLOperator() ||
+					EdxlopPhysicalParallelTableScan == dxl_op->GetDXLOperator());
 
 		return dynamic_cast<CDXLPhysicalTableScan *>(dxl_op);
 	}
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/dxl/xml/dxltokens.h b/src/backend/gporca/libnaucrates/include/naucrates/dxl/xml/dxltokens.h
index 5a61801511a..9c5d89fe8ae 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/dxl/xml/dxltokens.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/dxl/xml/dxltokens.h
@@ -96,6 +96,7 @@ enum Edxltoken
 	EdxltokenPhysical,
 
 	EdxltokenPhysicalTableScan,
+	EdxltokenPhysicalParallelTableScan,
 	EdxltokenPhysicalBitmapTableScan,
 	EdxltokenPhysicalDynamicBitmapTableScan,
 	EdxltokenPhysicalForeignScan,
@@ -374,6 +375,7 @@ enum Edxltoken
 	EdxltokenColNdvBySeg,
 
 	EdxltokenParamId,
+	EdxltokenParallelWorkers,
 
 	EdxltokenCtidColName,
 	EdxltokenOidColName,
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationCtasGPDB.h b/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationCtasGPDB.h
index 780c1be5b11..195a17f9e94 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationCtasGPDB.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationCtasGPDB.h
@@ -264,6 +264,12 @@ class CMDRelationCtasGPDB : public IMDRelationCtas
 		return 0;
 	}
 
+	INT SegFileCount() const override
+	{
+		GPOS_ASSERT(!"Function should not be called for CTAS tables");
+		return -1;	// only reached when the assertion does not abort
+	}
+
 #ifdef GPOS_DEBUG
 	// debug print of the metadata relation
 	void DebugPrint(IOstream &os) const override;
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationGPDB.h b/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationGPDB.h
index f15b0f26ecc..ecb4bb4a4d4 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationGPDB.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/md/CMDRelationGPDB.h
@@ -122,13 +122,19 @@ class CMDRelationGPDB : public IMDRelation
 	// rows
 	CDouble m_rows;
 
+	// segment file count for AO/AOCO tables (-1 for non-AO tables)
+	INT m_seg_file_count;
+
+	// parallel workers setting from table options (-1 if not set)
+	INT m_parallel_workers;
+
 public:
 	CMDRelationGPDB(const CMDRelationGPDB &) = delete;
 
 	// ctor
 	CMDRelationGPDB(
 		CMemoryPool *mp, IMDId *mdid, CMDName *mdname, BOOL is_temp_table,
-		Erelstoragetype rel_storage_type, 
+		Erelstoragetype rel_storage_type,
 		Ereldistrpolicy rel_distr_policy, CMDColumnArray *mdcol_array,
 		ULongPtrArray *distr_col_array, IMdIdArray *distr_opfamilies,
 		ULongPtrArray *partition_cols_array, CharPtrArray *str_part_types_array,
@@ -242,6 +248,16 @@ class CMDRelationGPDB : public IMDRelation
 
 	CDouble Rows() const override;
 
+	INT SegFileCount() const override;
+
+	// Set segment file count for AO/AOCO tables
+	void SetSegFileCount(INT seg_file_count);
+
+	INT ParallelWorkers() const override;
+
+	// Set parallel workers from table options
+	void SetParallelWorkers(INT parallel_workers);
+
 #ifdef GPOS_DEBUG
 	// debug print of the metadata relation
 	void DebugPrint(IOstream &os) const override;
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelation.h b/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelation.h
index 036af05597a..b5e7a8f22ee 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelation.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelation.h
@@ -203,6 +203,12 @@ class IMDRelation : public IMDCacheObject
 
 	// rows
 	virtual CDouble Rows() const = 0;
+
+	// segment file count for AO/AOCO tables (returns -1 for non-AO tables)
+	virtual INT SegFileCount() const = 0;
+
+	// parallel workers setting from table options (returns -1 if not set)
+	virtual INT ParallelWorkers() const = 0;
 };
 
 // common structure over relation and external relation metadata for index info
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelationCtas.h b/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelationCtas.h
index 18aa6b8e30c..ae805c9cc17 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelationCtas.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/md/IMDRelationCtas.h
@@ -108,6 +108,13 @@ class IMDRelationCtas : public IMDRelation
 
 	// CTAS storage options
 	virtual CDXLCtasStorageOptions *GetDxlCtasStorageOption() const = 0;
+
+	// parallel workers - CTAS relations always report the "not set" value
+	INT
+	ParallelWorkers() const override
+	{
+		return -1;  // -1 is what IMDRelation documents as "not set"
+	}
 };
 }  // namespace gpmd
 
diff --git a/src/backend/gporca/libnaucrates/include/naucrates/traceflags/traceflags.h b/src/backend/gporca/libnaucrates/include/naucrates/traceflags/traceflags.h
index 2e489f214e5..8a18ace986a 100644
--- a/src/backend/gporca/libnaucrates/include/naucrates/traceflags/traceflags.h
+++ b/src/backend/gporca/libnaucrates/include/naucrates/traceflags/traceflags.h
@@ -250,6 +250,9 @@ enum EOptTraceFlag
 	// Use the all key exclude the non-fixed key in AGG pds
 	EopttraceAggRRSExcludeNonFixedKey = 103053,
 
+	// Disable streaming hash agg in ORCA-generated local partial aggregations
+	EopttraceDisableStreamingHashAgg = 103054,
+
 	///////////////////////////////////////////////////////
 	///////////////////// statistics flags ////////////////
 	//////////////////////////////////////////////////////
diff --git a/src/backend/gporca/libnaucrates/src/md/CMDRelationGPDB.cpp b/src/backend/gporca/libnaucrates/src/md/CMDRelationGPDB.cpp
index 03f52c3fdd0..dceb24d0c55 100644
--- a/src/backend/gporca/libnaucrates/src/md/CMDRelationGPDB.cpp
+++ b/src/backend/gporca/libnaucrates/src/md/CMDRelationGPDB.cpp
@@ -62,7 +62,9 @@ CMDRelationGPDB::CMDRelationGPDB(
 	  m_colpos_nondrop_colpos_map(nullptr),
 	  m_attrno_nondrop_col_pos_map(nullptr),
 	  m_nondrop_col_pos_array(nullptr),
-	  m_rows(rows)
+	  m_rows(rows),
+	  m_seg_file_count(-1),
+	  m_parallel_workers(-1)
 {
 	GPOS_ASSERT(mdid->IsValid());
 	GPOS_ASSERT(nullptr != mdcol_array);
@@ -595,6 +597,46 @@ CMDRelationGPDB::Rows() const
 	return m_rows;
 }
 
+INT
+CMDRelationGPDB::SegFileCount() const
+{
+	return m_seg_file_count;  // ctor default is -1; see SetSegFileCount()
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CMDRelationGPDB::SetSegFileCount
+//
+//	@doc:
+//		Set segment file count for AO/AOCO tables; stored without checks
+//
+//---------------------------------------------------------------------------
+void
+CMDRelationGPDB::SetSegFileCount(INT seg_file_count)
+{
+	m_seg_file_count = seg_file_count;
+}
+
+INT
+CMDRelationGPDB::ParallelWorkers() const
+{
+	return m_parallel_workers;  // ctor default is -1; see SetParallelWorkers()
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CMDRelationGPDB::SetParallelWorkers
+//
+//	@doc:
+//		Set parallel workers from table options; stored without checks
+//
+//---------------------------------------------------------------------------
+void
+CMDRelationGPDB::SetParallelWorkers(INT parallel_workers)
+{
+	m_parallel_workers = parallel_workers;
+}
+
 //---------------------------------------------------------------------------
 //	@function:
 //		CMDRelationGPDB::Serialize
diff --git a/src/backend/gporca/libnaucrates/src/operators/CDXLOperatorFactory.cpp b/src/backend/gporca/libnaucrates/src/operators/CDXLOperatorFactory.cpp
index 8b037b833f0..a4d4914b731 100644
--- a/src/backend/gporca/libnaucrates/src/operators/CDXLOperatorFactory.cpp
+++ b/src/backend/gporca/libnaucrates/src/operators/CDXLOperatorFactory.cpp
@@ -28,6 +28,7 @@
 #include "naucrates/dxl/operators/CDXLDatumStatsDoubleMappable.h"
 #include "naucrates/dxl/operators/CDXLDatumStatsLintMappable.h"
 #include "naucrates/dxl/operators/CDXLLogicalJoin.h"
+#include "naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h"
 #include "naucrates/dxl/operators/CDXLPhysicalAgg.h"
 #include "naucrates/dxl/operators/CDXLPhysicalAppend.h"
 #include "naucrates/dxl/operators/CDXLPhysicalBroadcastMotion.h"
@@ -101,6 +102,31 @@ CDXLOperatorFactory::MakeDXLTblScan(CDXLMemoryManager *dxl_memory_manager,
 	return GPOS_NEW(mp) CDXLPhysicalTableScan(mp);
 }
 
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLOperatorFactory::MakeDXLParallelTblScan
+//
+//	@doc:
+//		Construct a parallel table scan operator
+//
+//---------------------------------------------------------------------------
+CDXLPhysical *
+CDXLOperatorFactory::MakeDXLParallelTblScan(CDXLMemoryManager *dxl_memory_manager,
+											const Attributes &attrs)
+{
+	// read the ParallelWorkers attribute of the ParallelTableScan element
+	// and convert it to an unsigned worker count
+	const XMLCh *xmlszWorkers = ExtractAttrValue(
+		attrs, EdxltokenParallelWorkers, EdxltokenPhysicalParallelTableScan);
+	const ULONG ulParallelWorkers = ConvertAttrValueToUlong(
+		dxl_memory_manager, xmlszWorkers, EdxltokenParallelWorkers,
+		EdxltokenPhysicalParallelTableScan);
+
+	// allocate the operator from the memory manager's pool
+	CMemoryPool *mp = dxl_memory_manager->Pmp();
+	return GPOS_NEW(mp) CDXLPhysicalParallelTableScan(mp, ulParallelWorkers);
+}
+
 //---------------------------------------------------------------------------
 //	@function:
 //		CDXLOperatorFactory::MakeDXLResult
diff --git a/src/backend/gporca/libnaucrates/src/operators/CDXLPhysicalParallelTableScan.cpp b/src/backend/gporca/libnaucrates/src/operators/CDXLPhysicalParallelTableScan.cpp
new file mode 100644
index 00000000000..a96657031e9
--- /dev/null
+++ b/src/backend/gporca/libnaucrates/src/operators/CDXLPhysicalParallelTableScan.cpp
@@ -0,0 +1,162 @@
+/*-------------------------------------------------------------------------
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ *
+ * CDXLPhysicalParallelTableScan.cpp
+ *
+ * IDENTIFICATION
+ *	  src/backend/gporca/libnaucrates/src/operators/CDXLPhysicalParallelTableScan.cpp
+ *
+ *-------------------------------------------------------------------------
+ */
+
+#include "naucrates/dxl/operators/CDXLPhysicalParallelTableScan.h"
+
+#include "naucrates/dxl/operators/CDXLNode.h"
+#include "naucrates/dxl/xml/CXMLSerializer.h"
+
+using namespace gpos;
+using namespace gpdxl;
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::CDXLPhysicalParallelTableScan
+//
+//	@doc:
+//		Constructor taking a table descriptor and the worker count
+//
+//---------------------------------------------------------------------------
+CDXLPhysicalParallelTableScan::CDXLPhysicalParallelTableScan(CMemoryPool *mp,
+															 CDXLTableDescr *table_descr,
+															 ULONG ulParallelWorkers)
+	: CDXLPhysicalTableScan(mp, table_descr),
+	  m_ulParallelWorkers(ulParallelWorkers)
+{
+	GPOS_ASSERT(ulParallelWorkers > 0);  // asserts a non-zero worker count
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::CDXLPhysicalParallelTableScan
+//
+//	@doc:
+//		Constructor with uninitialized table descriptor; worker count only
+//
+//---------------------------------------------------------------------------
+CDXLPhysicalParallelTableScan::CDXLPhysicalParallelTableScan(CMemoryPool *mp,
+															 ULONG ulParallelWorkers)
+	: CDXLPhysicalTableScan(mp),
+	  m_ulParallelWorkers(ulParallelWorkers)
+{
+	GPOS_ASSERT(ulParallelWorkers > 0);  // asserts a non-zero worker count
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::GetDXLOperator
+//
+//	@doc:
+//		Operator type; always EdxlopPhysicalParallelTableScan
+//
+//---------------------------------------------------------------------------
+Edxlopid
+CDXLPhysicalParallelTableScan::GetDXLOperator() const
+{
+	return EdxlopPhysicalParallelTableScan;
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::GetOpNameStr
+//
+//	@doc:
+//		Operator name; the DXL token string of the parallel table scan
+//
+//---------------------------------------------------------------------------
+const CWStringConst *
+CDXLPhysicalParallelTableScan::GetOpNameStr() const
+{
+	return CDXLTokens::GetDXLTokenStr(EdxltokenPhysicalParallelTableScan);
+}
+
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::SerializeToDXL
+//
+//	@doc:
+//		Serialize operator in DXL format (attribute, properties, children)
+//
+//---------------------------------------------------------------------------
+void
+CDXLPhysicalParallelTableScan::SerializeToDXL(CXMLSerializer *xml_serializer,
+											   const CDXLNode *dxlnode) const
+{
+	const CWStringConst *element_name = GetOpNameStr();
+	xml_serializer->OpenElement(CDXLTokens::GetDXLTokenStr(EdxltokenNamespacePrefix),
+								element_name);
+
+	// serialize the worker count as the ParallelWorkers attribute
+	xml_serializer->AddAttribute(CDXLTokens::GetDXLTokenStr(EdxltokenParallelWorkers),
+								 m_ulParallelWorkers);
+
+	// serialize properties of the node
+	dxlnode->SerializePropertiesToDXL(xml_serializer);
+
+	// serialize children (AssertValid expects projection list and filter)
+	dxlnode->SerializeChildrenToDXL(xml_serializer);
+	// NOTE(review): no table descriptor is written here - confirm DXL round-trip does not need it
+	xml_serializer->CloseElement(CDXLTokens::GetDXLTokenStr(EdxltokenNamespacePrefix),
+								 element_name);
+}
+
+#ifdef GPOS_DEBUG
+//---------------------------------------------------------------------------
+//	@function:
+//		CDXLPhysicalParallelTableScan::AssertValid
+//
+//	@doc:
+//		Checks whether operator node is well-structured
+//
+//---------------------------------------------------------------------------
+void
+CDXLPhysicalParallelTableScan::AssertValid(const CDXLNode *dxlnode,
+											BOOL validate_children) const
+{
+	// delegate the base CDXLPhysical validation first
+	CDXLPhysical::AssertValid(dxlnode, validate_children);
+
+	// exactly two children are expected: [0] projection list, [1] filter
+	GPOS_ASSERT(2 == dxlnode->Arity());
+	CDXLNode *pdxlnPrL = (*dxlnode)[0];
+	CDXLNode *pdxlnFilter = (*dxlnode)[1];
+	GPOS_ASSERT(EdxlopScalarProjectList ==
+				pdxlnPrL->GetOperator()->GetDXLOperator());
+	GPOS_ASSERT(EdxlopScalarFilter ==
+				pdxlnFilter->GetOperator()->GetDXLOperator());
+
+	// descend into both children only when the caller asked for it
+	if (!validate_children)
+	{
+		return;
+	}
+	pdxlnPrL->GetOperator()->AssertValid(pdxlnPrL, validate_children);
+	pdxlnFilter->GetOperator()->AssertValid(pdxlnFilter, validate_children);
+}
+#endif	// GPOS_DEBUG
+
+// EOF
\ No newline at end of file
diff --git a/src/backend/gporca/libnaucrates/src/operators/Makefile b/src/backend/gporca/libnaucrates/src/operators/Makefile
index 418bd5a0fd2..1d78142feab 100644
--- a/src/backend/gporca/libnaucrates/src/operators/Makefile
+++ b/src/backend/gporca/libnaucrates/src/operators/Makefile
@@ -85,6 +85,7 @@ OBJS        = CDXLColDescr.o \
               CDXLPhysicalSplit.o \
               CDXLPhysicalTVF.o \
               CDXLPhysicalTableScan.o \
+              CDXLPhysicalParallelTableScan.o \
               CDXLPhysicalValuesScan.o \
               CDXLPhysicalWindow.o \
               CDXLProperties.o \
diff --git a/src/backend/gporca/libnaucrates/src/parser/CParseHandlerOptimizerConfig.cpp b/src/backend/gporca/libnaucrates/src/parser/CParseHandlerOptimizerConfig.cpp
index 3b64d409bfe..49b4d786b55 100644
--- a/src/backend/gporca/libnaucrates/src/parser/CParseHandlerOptimizerConfig.cpp
+++ b/src/backend/gporca/libnaucrates/src/parser/CParseHandlerOptimizerConfig.cpp
@@ -273,7 +273,7 @@ CParseHandlerOptimizerConfig::EndElement(const XMLCh *const,  // element_uri,
 	}
 
 	m_optimizer_config = GPOS_NEW(m_mp) COptimizerConfig(
-		pec, stats_config, pcteconfig, pcm, phint, pplanhint, pwindowoidsGPDB);
+		pec, stats_config, pcteconfig, pcm, phint, pplanhint, pwindowoidsGPDB, false);
 
 	CParseHandlerTraceFlags *pphTraceFlags =
 		dynamic_cast<CParseHandlerTraceFlags *>((*this)[this->Length() - 1]);
diff --git a/src/backend/gporca/libnaucrates/src/xml/dxltokens.cpp b/src/backend/gporca/libnaucrates/src/xml/dxltokens.cpp
index 0f59d689a05..79fcc9f7d6a 100644
--- a/src/backend/gporca/libnaucrates/src/xml/dxltokens.cpp
+++ b/src/backend/gporca/libnaucrates/src/xml/dxltokens.cpp
@@ -112,6 +112,7 @@ CDXLTokens::Init(CMemoryPool *mp)
 		{EdxltokenPhysical, GPOS_WSZ_LIT("OpPhysical")},
 
 		{EdxltokenPhysicalTableScan, GPOS_WSZ_LIT("TableScan")},
+		{EdxltokenPhysicalParallelTableScan, GPOS_WSZ_LIT("ParallelTableScan")},
 		{EdxltokenPhysicalBitmapTableScan, GPOS_WSZ_LIT("BitmapTableScan")},
 		{EdxltokenPhysicalDynamicBitmapTableScan,
 		 GPOS_WSZ_LIT("DynamicBitmapTableScan")},
@@ -420,6 +421,7 @@ CDXLTokens::Init(CMemoryPool *mp)
 		{EdxltokenColNdvBySeg, GPOS_WSZ_LIT("NdvBySeg")},
 
 		{EdxltokenParamId, GPOS_WSZ_LIT("ParamId")},
+		{EdxltokenParallelWorkers, GPOS_WSZ_LIT("ParallelWorkers")},
 
 		{EdxltokenCtidColName, GPOS_WSZ_LIT("ctid")},
 		{EdxltokenOidColName, GPOS_WSZ_LIT("oid")},
diff --git a/src/backend/gporca/server/src/startup/main.cpp b/src/backend/gporca/server/src/startup/main.cpp
index 29be9dc9994..9418fa94abb 100644
--- a/src/backend/gporca/server/src/startup/main.cpp
+++ b/src/backend/gporca/server/src/startup/main.cpp
@@ -381,6 +381,24 @@ PvExec(void *pv)
 	return nullptr;
 }
 
+//---------------------------------------------------------------------------
+//	Stub implementations for PostgreSQL symbols required by GPORCA
+//	These are needed for standalone testing without linking to PostgreSQL
+//---------------------------------------------------------------------------
+
+// Stub for the parallel mode check; unit tests run with it enabled.
+namespace gpdb
+{
+bool IsParallelModeOK()
+{
+	return true;
+}
+}  // namespace gpdb
+
+// Stub GUC variables for parallel execution (fixed values for standalone testing)
+int max_parallel_workers_per_gather = 2;
+bool enable_parallel = true;
+double parallel_setup_cost = 1000.0;
 
 //---------------------------------------------------------------------------
 //	@function:
diff --git a/src/backend/gporca/server/src/unittest/CTestUtils.cpp b/src/backend/gporca/server/src/unittest/CTestUtils.cpp
index bca99766fda..5ce83305b32 100644
--- a/src/backend/gporca/server/src/unittest/CTestUtils.cpp
+++ b/src/backend/gporca/server/src/unittest/CTestUtils.cpp
@@ -3539,7 +3539,7 @@ CTestUtils::EresSamplePlans(const CHAR *rgszFileNames[], ULONG ulTests,
 				CStatisticsConfig::PstatsconfDefault(mp),
 				CCTEConfig::PcteconfDefault(mp), ICostModel::PcmDefault(mp),
 				CHint::PhintDefault(mp), nullptr,
-				CWindowOids::GetWindowOids(mp));
+				CWindowOids::GetWindowOids(mp), false);
 		}
 		else
 		{
@@ -3678,7 +3678,7 @@ CTestUtils::EresCheckPlans(const CHAR *rgszFileNames[], ULONG ulTests,
 				CStatisticsConfig::PstatsconfDefault(mp),
 				CCTEConfig::PcteconfDefault(mp), ICostModel::PcmDefault(mp),
 				CHint::PhintDefault(mp), nullptr,
-				CWindowOids::GetWindowOids(mp));
+				CWindowOids::GetWindowOids(mp), false);
 		}
 		else
 		{
diff --git a/src/backend/gporca/server/src/unittest/dxl/statistics/CCardinalityTestUtils.cpp b/src/backend/gporca/server/src/unittest/dxl/statistics/CCardinalityTestUtils.cpp
index f95ecb14ee4..24da702044c 100644
--- a/src/backend/gporca/server/src/unittest/dxl/statistics/CCardinalityTestUtils.cpp
+++ b/src/backend/gporca/server/src/unittest/dxl/statistics/CCardinalityTestUtils.cpp
@@ -112,7 +112,8 @@ CCardinalityTestUtils::PhistInt4Remain(CMemoryPool *mp, ULONG num_of_buckets,
 	}
 
 	return GPOS_NEW(mp) CHistogram(mp, histogram_buckets, true, null_freq,
-								   num_NDV_remain, freq_remaining);
+								   num_NDV_remain, freq_remaining,
+								   num_NDV_remain /* distinct_by_segs */);
 }
 
 // helper function to generate an example int histogram
diff --git a/src/backend/gporca/server/src/unittest/dxl/statistics/CHistogramTest.cpp b/src/backend/gporca/server/src/unittest/dxl/statistics/CHistogramTest.cpp
index b6eb14a8378..900e16a3f7d 100644
--- a/src/backend/gporca/server/src/unittest/dxl/statistics/CHistogramTest.cpp
+++ b/src/backend/gporca/server/src/unittest/dxl/statistics/CHistogramTest.cpp
@@ -268,7 +268,8 @@ CHistogramTest::PhistExampleInt4Remain(CMemoryPool *mp)
 
 	return GPOS_NEW(mp)
 		CHistogram(mp, histogram_buckets, true, 0.1 /*null_freq*/,
-				   2.0 /*distinct_remaining*/, 0.4 /*freq_remaining*/);
+				   2.0 /*distinct_remaining*/, 0.4 /*freq_remaining*/,
+				   2.0 /*distinct_by_segs*/);
 }
 
 // basis skew test
diff --git a/src/backend/gporca/server/src/unittest/dxl/statistics/CStatisticsTest.cpp b/src/backend/gporca/server/src/unittest/dxl/statistics/CStatisticsTest.cpp
index e596add7f0d..6b0345b98e6 100644
--- a/src/backend/gporca/server/src/unittest/dxl/statistics/CStatisticsTest.cpp
+++ b/src/backend/gporca/server/src/unittest/dxl/statistics/CStatisticsTest.cpp
@@ -504,7 +504,7 @@ CStatisticsTest::EresUnittest_CStatisticsBasic()
 
 	ULongPtrArray *aggs = GPOS_NEW(mp) ULongPtrArray(mp);
 	CStatistics *pstats4 = CGroupByStatsProcessor::CalcGroupByStats(
-		mp, stats, GCs, aggs, nullptr /*keys*/);
+		mp, stats, GCs, aggs, nullptr /*keys*/, false /*is_partial*/);
 
 	GPOS_TRACE(GPOS_WSZ_LIT("pstats4 = stats group by"));
 	CCardinalityTestUtils::PrintStats(mp, pstats4);
diff --git a/src/backend/gporca/server/src/unittest/gpopt/minidump/CICGTest.cpp b/src/backend/gporca/server/src/unittest/gpopt/minidump/CICGTest.cpp
index 58d3971cfcf..facd4126ea2 100644
--- a/src/backend/gporca/server/src/unittest/gpopt/minidump/CICGTest.cpp
+++ b/src/backend/gporca/server/src/unittest/gpopt/minidump/CICGTest.cpp
@@ -303,7 +303,7 @@ CICGTest::EresUnittest_NegativeIndexApplyTests()
 				CEnumeratorConfig::GetEnumeratorCfg(mp, 0 /*plan_id*/),
 				CStatisticsConfig::PstatsconfDefault(mp),
 				CCTEConfig::PcteconfDefault(mp), pcm, CHint::PhintDefault(mp),
-				nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp));
+				nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp), false);
 			CDXLNode *pdxlnPlan = CMinidumperUtils::PdxlnExecuteMinidump(
 				mp, rgszNegativeIndexApplyFileNames[ul],
 				GPOPT_TEST_SEGMENTS /*ulSegments*/, 1 /*ulSessionId*/,
diff --git a/src/backend/gporca/server/src/unittest/gpopt/minidump/CMiniDumperDXLTest.cpp b/src/backend/gporca/server/src/unittest/gpopt/minidump/CMiniDumperDXLTest.cpp
index f046a185f29..b088aa5f6c5 100644
--- a/src/backend/gporca/server/src/unittest/gpopt/minidump/CMiniDumperDXLTest.cpp
+++ b/src/backend/gporca/server/src/unittest/gpopt/minidump/CMiniDumperDXLTest.cpp
@@ -127,7 +127,7 @@ CMiniDumperDXLTest::EresUnittest_Basic()
 			CStatisticsConfig::PstatsconfDefault(mp),
 			CCTEConfig::PcteconfDefault(mp), ICostModel::PcmDefault(mp),
 			CHint::PhintDefault(mp), nullptr /* pplanhint */,
-			CWindowOids::GetWindowOids(mp));
+			CWindowOids::GetWindowOids(mp), false);
 
 		// setup opt ctx
 		CAutoOptCtxt aoc(mp, &mda, nullptr, /* pceeval */
diff --git a/src/backend/gporca/server/src/unittest/gpopt/minidump/CMissingStatsTest.cpp b/src/backend/gporca/server/src/unittest/gpopt/minidump/CMissingStatsTest.cpp
index a2d362aa5a2..6dc10137187 100644
--- a/src/backend/gporca/server/src/unittest/gpopt/minidump/CMissingStatsTest.cpp
+++ b/src/backend/gporca/server/src/unittest/gpopt/minidump/CMissingStatsTest.cpp
@@ -88,7 +88,7 @@ CMissingStatsTest::EresUnittest_RunTests()
 			CEnumeratorConfig::GetEnumeratorCfg(mp, 0 /*plan_id*/),
 			CStatisticsConfig::PstatsconfDefault(mp),
 			CCTEConfig::PcteconfDefault(mp), pcm, CHint::PhintDefault(mp),
-			nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp));
+			nullptr /* pplanhint */, CWindowOids::GetWindowOids(mp), false);
 		SMissingStatsTestCase testCase = rgtc[ul];
 
 		CDXLNode *pdxlnPlan = CMinidumperUtils::PdxlnExecuteMinidump(
diff --git a/src/backend/gporca/server/src/unittest/gpopt/xforms/CXformTest.cpp b/src/backend/gporca/server/src/unittest/gpopt/xforms/CXformTest.cpp
index 910a10ad2ab..ba8e554bf08 100644
--- a/src/backend/gporca/server/src/unittest/gpopt/xforms/CXformTest.cpp
+++ b/src/backend/gporca/server/src/unittest/gpopt/xforms/CXformTest.cpp
@@ -172,7 +172,7 @@ CXformTest::EresUnittest_ApplyXforms_CTE()
 
 	pdrgpexpr->Append(pexprConsumer);
 	COptCtxt::PoctxtFromTLS()->Pcteinfo()->IncrementConsumers(ulCTEId);
-	COptCtxt::PoctxtFromTLS()->Pcteinfo()->AddCTEConsumer(pexprNewConsumer);
+	COptCtxt::PoctxtFromTLS()->Pcteinfo()->AddCTEConsumer(pexprConsumer);
 
 	pexprConsumer->AddRef();
 	CExpression *pexprSelect =
diff --git a/src/backend/optimizer/path/joinpath.c b/src/backend/optimizer/path/joinpath.c
index d4c2b793bb5..b5e7ef3b60c 100644
--- a/src/backend/optimizer/path/joinpath.c
+++ b/src/backend/optimizer/path/joinpath.c
@@ -2327,15 +2327,9 @@ hash_inner_and_outer(PlannerInfo *root,
 		 * able to properly guarantee uniqueness.  Similarly, we can't handle
 		 * JOIN_FULL and JOIN_RIGHT, because they can produce false null
 		 * extended rows.  Also, the resulting path must not be parameterized.
-		 * We would be able to support JOIN_FULL and JOIN_RIGHT for Parallel
-		 * Hash, since in that case we're back to a single hash table with a
-		 * single set of match bits for each batch, but that will require
-		 * figuring out a deadlock-free way to wait for the probe to finish.
 		 */
 		if (joinrel->consider_parallel &&
 			save_jointype != JOIN_UNIQUE_OUTER &&
-			save_jointype != JOIN_FULL &&
-			save_jointype != JOIN_RIGHT &&
 			outerrel->partial_pathlist != NIL &&
 			bms_is_empty(joinrel->lateral_relids))
 		{
@@ -2372,9 +2366,13 @@ hash_inner_and_outer(PlannerInfo *root,
 			 * total inner path will also be parallel-safe, but if not, we'll
 			 * have to search for the cheapest safe, unparameterized inner
 			 * path.  If doing JOIN_UNIQUE_INNER, we can't use any alternative
-			 * inner path.
+			 * inner path.  If full or right join, we can't use parallelism
+			 * (building the hash table in each backend) because no one
+			 * process has all the match bits.
 			 */
-			if (cheapest_total_inner->parallel_safe)
+			if (save_jointype == JOIN_FULL || save_jointype == JOIN_RIGHT)
+				cheapest_safe_inner = NULL;
+			else if (cheapest_total_inner->parallel_safe)
 				cheapest_safe_inner = cheapest_total_inner;
 			else if (save_jointype != JOIN_UNIQUE_INNER)
 				cheapest_safe_inner =
diff --git a/src/backend/optimizer/plan/aqumv.c b/src/backend/optimizer/plan/aqumv.c
index 4a576061780..04c173f41de 100644
--- a/src/backend/optimizer/plan/aqumv.c
+++ b/src/backend/optimizer/plan/aqumv.c
@@ -996,3 +996,352 @@ groupby_query_rewrite(PlannerInfo *subroot,
 	subroot->append_rel_list = NIL;
 	return true;
 }
+
+/*
+ * aqumv_query_is_exact_match
+ *
+ * Compare two Query trees for semantic identity.  Both should be at the
+ * same preprocessing stage (raw parser output).  Returns true only if
+ * every query-semantics field checked below is structurally identical.
+ * groupingSets and windowClause are compared too: ROLLUP/CUBE and window
+ * definitions live there, not in groupClause or the target list.
+ */
+static bool
+aqumv_query_is_exact_match(Query *raw_parse, Query *viewQuery)
+{
+	ListCell   *lc1, *lc2;
+
+	/* Both must be CMD_SELECT */
+	if (raw_parse->commandType != CMD_SELECT ||
+		viewQuery->commandType != CMD_SELECT)
+		return false;
+
+	/* Compare range tables; equal() on lists also rejects a length mismatch */
+	if (!equal(raw_parse->rtable, viewQuery->rtable))
+		return false;
+
+	/* Compare join tree (FROM clause + WHERE quals) */
+	if (!equal(raw_parse->jointree, viewQuery->jointree))
+		return false;
+
+	/* Compare target list entries: expressions and sort/group refs */
+	if (list_length(raw_parse->targetList) != list_length(viewQuery->targetList))
+		return false;
+	forboth(lc1, raw_parse->targetList, lc2, viewQuery->targetList)
+	{
+		TargetEntry *tle1 = lfirst_node(TargetEntry, lc1);
+		TargetEntry *tle2 = lfirst_node(TargetEntry, lc2);
+
+		if (!equal(tle1->expr, tle2->expr) ||
+			tle1->resjunk != tle2->resjunk ||
+			tle1->ressortgroupref != tle2->ressortgroupref)
+			return false;
+	}
+
+	/* Compare GROUP BY (incl. grouping sets), HAVING and WINDOW clauses */
+	if (!equal(raw_parse->groupClause, viewQuery->groupClause))
+		return false;
+	if (!equal(raw_parse->groupingSets, viewQuery->groupingSets))
+		return false;
+	if (raw_parse->groupDistinct != viewQuery->groupDistinct)
+		return false;
+	if (!equal(raw_parse->havingQual, viewQuery->havingQual))
+		return false;
+	if (!equal(raw_parse->windowClause, viewQuery->windowClause))
+		return false;
+
+	/* Compare ORDER BY, DISTINCT, LIMIT */
+	if (!equal(raw_parse->sortClause, viewQuery->sortClause))
+		return false;
+	if (!equal(raw_parse->distinctClause, viewQuery->distinctClause))
+		return false;
+	if (!equal(raw_parse->limitCount, viewQuery->limitCount))
+		return false;
+	if (!equal(raw_parse->limitOffset, viewQuery->limitOffset))
+		return false;
+	if (raw_parse->limitOption != viewQuery->limitOption)
+		return false;
+
+	/* Compare boolean flags */
+	if (raw_parse->hasAggs != viewQuery->hasAggs ||
+		raw_parse->hasWindowFuncs != viewQuery->hasWindowFuncs ||
+		raw_parse->hasDistinctOn != viewQuery->hasDistinctOn)
+		return false;
+
+	return true;
+}
+
+/*
+ * answer_query_using_materialized_views_for_join
+ *
+ * Handle multi-table JOIN queries via exact-match comparison, independent
+ * of the single-table AQUMV code path.  The saved raw parse tree (before
+ * any planner preprocessing) is compared against each stored viewQuery in
+ * gp_matview_aux.  On an exact match the query is rewritten to a simple
+ * SELECT FROM mv, which is adopted only if cheaper than current_rel.
+ *
+ * An MV is skipped if its stored view query is NULL, or if ORDER BY uses
+ * a junk target entry (the MV does not store junk columns).  Returns the
+ * MV scan rel when a rewrite is adopted, else the original current_rel.
+ */
+RelOptInfo *
+answer_query_using_materialized_views_for_join(PlannerInfo *root, AqumvContext aqumv_context)
+{
+	RelOptInfo		*current_rel = aqumv_context->current_rel;
+	query_pathkeys_callback qp_callback = aqumv_context->qp_callback;
+	Query			*parse = root->parse;
+	Query			*raw_parse = root->aqumv_raw_parse;
+	RelOptInfo		*mv_final_rel = current_rel;
+	Relation		matviewRel;
+	Relation		mvauxDesc;
+	TupleDesc		mvaux_tupdesc;
+	SysScanDesc		mvscan;
+	HeapTuple		tup;
+	Form_gp_matview_aux mvaux_tup;
+	bool			need_close = false;
+
+	/* Need the saved raw parse tree, and it must be a join (>1 RTE). */
+	if (raw_parse == NULL || list_length(raw_parse->rtable) <= 1)
+		return mv_final_rel;
+
+	/* Basic eligibility checks (same as single-table AQUMV). */
+	if (parse->commandType != CMD_SELECT ||
+		parse->rowMarks != NIL ||
+		parse->scatterClause != NIL ||
+		parse->cteList != NIL ||
+		parse->setOperations != NULL ||
+		parse->hasModifyingCTE ||
+		parse->parentStmtType == PARENTSTMTTYPE_REFRESH_MATVIEW ||
+		parse->parentStmtType == PARENTSTMTTYPE_CTAS ||
+		contain_mutable_functions((Node *) raw_parse) ||
+		parse->hasSubLinks)
+		return mv_final_rel;
+
+	mvauxDesc = table_open(GpMatviewAuxId, AccessShareLock);
+	mvaux_tupdesc = RelationGetDescr(mvauxDesc);
+
+	mvscan = systable_beginscan(mvauxDesc, InvalidOid, false, NULL, 0, NULL);
+
+	while (HeapTupleIsValid(tup = systable_getnext(mvscan)))
+	{
+		Datum		view_query_datum;
+		char		*view_query_str;
+		bool		is_null;
+		bool		sort_on_junk = false;
+		Query		*viewQuery;
+		RangeTblEntry *mvrte;
+		PlannerInfo	*subroot;
+		TupleDesc	mv_tupdesc;
+
+		CHECK_FOR_INTERRUPTS();
+		if (need_close)
+			table_close(matviewRel, AccessShareLock);
+
+		mvaux_tup = (Form_gp_matview_aux) GETSTRUCT(tup);
+		matviewRel = table_open(mvaux_tup->mvoid, AccessShareLock);
+		need_close = true;
+
+		if (!RelationIsPopulated(matviewRel))
+			continue;
+
+		/* MV must be up-to-date (IVM is always current). */
+		if (!RelationIsIVM(matviewRel) &&
+			!MatviewIsGeneralyUpToDate(RelationGetRelid(matviewRel)))
+			continue;
+
+		/* Get a copy of view query; a NULL attribute cannot be matched. */
+		view_query_datum = heap_getattr(tup, Anum_gp_matview_aux_view_query,
+										mvaux_tupdesc, &is_null);
+		if (is_null)
+			continue;
+
+		view_query_str = TextDatumGetCString(view_query_datum);
+		viewQuery = copyObject(stringToNode(view_query_str));
+		pfree(view_query_str);
+		Assert(IsA(viewQuery, Query));
+
+		/* Skip single-table viewQueries (handled by existing AQUMV). */
+		if (list_length(viewQuery->rtable) <= 1)
+			continue;
+
+		/* Exact match comparison between raw parse and view query. */
+		if (!aqumv_query_is_exact_match(raw_parse, viewQuery))
+			continue;
+
+		/*
+		 * We have an exact match.  Rewrite viewQuery to:
+		 *   SELECT mv.col1, mv.col2, ... FROM mv
+		 */
+		mv_tupdesc = RelationGetDescr(matviewRel);
+
+		/* Build new target list referencing MV columns. */
+		{
+			List	   *new_tlist = NIL;
+			ListCell   *lc;
+			ListCell   *slc;
+			int			attnum = 0;
+
+			foreach(lc, viewQuery->targetList)
+			{
+				TargetEntry *old_tle = lfirst_node(TargetEntry, lc);
+				TargetEntry *new_tle;
+				Var			*newVar;
+				Form_pg_attribute attr;
+
+				if (old_tle->resjunk)
+				{
+					/* Junk columns are not in the MV; note if ORDER BY uses one. */
+					foreach(slc, viewQuery->sortClause)
+					{
+						if (lfirst_node(SortGroupClause, slc)->tleSortGroupRef ==
+							old_tle->ressortgroupref)
+							sort_on_junk = true;
+					}
+					continue;
+				}
+
+				attnum++;
+				attr = TupleDescAttr(mv_tupdesc, attnum - 1);
+
+				newVar = makeVar(1, attr->attnum, attr->atttypid,
+								 attr->atttypmod, attr->attcollation, 0);
+				newVar->location = -1;
+
+				new_tle = makeTargetEntry((Expr *) newVar, (AttrNumber) attnum,
+										  old_tle->resname, false);
+				new_tle->ressortgroupref = old_tle->ressortgroupref;
+				new_tlist = lappend(new_tlist, new_tle);
+			}
+
+			/* The kept sortClause would reference a missing column: next MV. */
+			if (sort_on_junk)
+				continue;
+
+			viewQuery->targetList = new_tlist;
+		}
+
+		/* Create new RTE for the MV. */
+		mvrte = makeNode(RangeTblEntry);
+		mvrte->rtekind = RTE_RELATION;
+		mvrte->relid = RelationGetRelid(matviewRel);
+		mvrte->relkind = RELKIND_MATVIEW;
+		mvrte->rellockmode = AccessShareLock;
+		mvrte->inh = false;
+		mvrte->inFromCl = true;
+
+		/* Build eref with column names from the MV's TupleDesc. */
+		{
+			Alias  *eref = makeAlias(RelationGetRelationName(matviewRel), NIL);
+			int		i;
+			for (i = 0; i < mv_tupdesc->natts; i++)
+			{
+				Form_pg_attribute attr = TupleDescAttr(mv_tupdesc, i);
+				/* A dropped column keeps its slot, under an empty name. */
+				const char *colname = attr->attisdropped ? "" : NameStr(attr->attname);
+
+				eref->colnames = lappend(eref->colnames, makeString(pstrdup(colname)));
+			}
+			mvrte->eref = eref;
+			mvrte->alias = makeAlias(RelationGetRelationName(matviewRel), NIL);
+		}
+
+		viewQuery->rtable = list_make1(mvrte);
+		viewQuery->jointree = makeFromExpr(list_make1(makeNode(RangeTblRef)), NULL);
+		((RangeTblRef *) linitial(viewQuery->jointree->fromlist))->rtindex = 1;
+
+		/* Clear aggregation/grouping state — already materialized in MV. */
+		viewQuery->hasAggs = false;
+		viewQuery->groupClause = NIL;
+		viewQuery->groupingSets = NIL;
+		viewQuery->havingQual = NULL;
+		/* Keep sortClause: upper planner needs it to add Sort node. */
+		viewQuery->distinctClause = NIL;
+		viewQuery->hasDistinctOn = false;
+		viewQuery->hasWindowFuncs = false;
+		viewQuery->hasTargetSRFs = false;
+		viewQuery->limitCount = parse->limitCount;
+		viewQuery->limitOffset = parse->limitOffset;
+		viewQuery->limitOption = parse->limitOption;
+
+		/* Create subroot for planning the MV scan. */
+		subroot = (PlannerInfo *) palloc(sizeof(PlannerInfo));
+		memcpy(subroot, root, sizeof(PlannerInfo));
+		subroot->parent_root = root;
+		subroot->eq_classes = NIL;
+		subroot->plan_params = NIL;
+		subroot->outer_params = NULL;
+		subroot->init_plans = NIL;
+		subroot->agginfos = NIL;
+		subroot->aggtransinfos = NIL;
+		subroot->parse = viewQuery;
+		subroot->tuple_fraction = root->tuple_fraction;
+		subroot->limit_tuples = root->limit_tuples;
+		subroot->append_rel_list = NIL;
+		subroot->hasHavingQual = false;
+		subroot->hasNonPartialAggs = false;
+		subroot->hasNonSerialAggs = false;
+		subroot->numOrderedAggs = 0;
+		subroot->hasNonCombine = false;
+		subroot->numPureOrderedAggs = 0;
+
+		subroot->processed_tlist = NIL;
+		preprocess_targetlist(subroot);
+
+		/* Compute final locus for the MV scan. */
+		subroot->final_locus = cdbllize_get_final_locus(subroot,
+			make_pathtarget_from_tlist(subroot->processed_tlist));
+
+		/*
+		 * Plan the MV scan.  Clear qp_extra's groupClause and activeWindows
+		 * because the rewritten viewQuery is a simple SELECT from the MV
+		 * with no GROUP BY or windowing.  standard_qp_callback would
+		 * otherwise try to compute group_pathkeys from stale expressions.
+		 *
+		 * Safe: grouping_planner() no longer reads qp_extra after AQUMV.
+		 */
+		{
+			standard_qp_extra *qp = (standard_qp_extra *) aqumv_context->qp_extra;
+			qp->activeWindows = NIL;
+			qp->groupClause = NIL;
+		}
+		mv_final_rel = query_planner(subroot, qp_callback, aqumv_context->qp_extra);
+
+		/* Cost-based decision: use MV only if cheaper. */
+		if (mv_final_rel->cheapest_total_path->total_cost < current_rel->cheapest_total_path->total_cost)
+		{
+			root->parse = viewQuery;
+			root->processed_tlist = subroot->processed_tlist;
+			root->agginfos = subroot->agginfos;
+			root->aggtransinfos = subroot->aggtransinfos;
+			root->simple_rte_array = subroot->simple_rte_array;
+			root->simple_rel_array = subroot->simple_rel_array;
+			root->simple_rel_array_size = subroot->simple_rel_array_size;
+			root->hasNonPartialAggs = subroot->hasNonPartialAggs;
+			root->hasNonSerialAggs = subroot->hasNonSerialAggs;
+			root->numOrderedAggs = subroot->numOrderedAggs;
+			root->hasNonCombine = subroot->hasNonCombine;
+			root->numPureOrderedAggs = subroot->numPureOrderedAggs;
+			root->hasHavingQual = subroot->hasHavingQual;
+			root->group_pathkeys = subroot->group_pathkeys;
+			root->sort_pathkeys = subroot->sort_pathkeys;
+			root->query_pathkeys = subroot->query_pathkeys;
+			root->distinct_pathkeys = subroot->distinct_pathkeys;
+			root->eq_classes = subroot->eq_classes;
+			root->append_rel_list = subroot->append_rel_list;
+			current_rel = mv_final_rel;
+			table_close(matviewRel, NoLock);	/* lock on the chosen MV is kept */
+			need_close = false;
+			break;
+		}
+
+		/* MV is not cheaper, reset and try next. */
+		mv_final_rel = current_rel;
+	}
+
+	if (need_close)
+		table_close(matviewRel, AccessShareLock);
+	systable_endscan(mvscan);
+	table_close(mvauxDesc, AccessShareLock);
+
+	return current_rel;
+}
diff --git a/src/backend/optimizer/plan/createplan.c b/src/backend/optimizer/plan/createplan.c
index 53c1bf7d338..20c1587b062 100644
--- a/src/backend/optimizer/plan/createplan.c
+++ b/src/backend/optimizer/plan/createplan.c
@@ -47,6 +47,7 @@
 #include "parser/parsetree.h"
 #include "partitioning/partdesc.h"
 #include "partitioning/partprune.h"
+#include "tcop/tcopprot.h"
 #include "utils/lsyscache.h"
 #include "utils/uri.h"
 
@@ -8482,7 +8483,19 @@ make_modifytable(PlannerInfo *root, Plan *subplan,
 
 			Assert(rte->rtekind == RTE_RELATION);
 			if (rte->relkind == RELKIND_FOREIGN_TABLE)
+			{
+				/* Check if the access to foreign tables is restricted */
+				if (unlikely((restrict_nonsystem_relation_kind & RESTRICT_RELKIND_FOREIGN_TABLE) != 0))
+				{
+					/* there must not be built-in foreign tables */
+					Assert(rte->relid >= FirstNormalObjectId);
+					ereport(ERROR,
+							(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+							 errmsg("access to non-system foreign table is restricted")));
+				}
+
 				fdwroutine = GetFdwRoutineByRelId(rte->relid);
+			}
 			else
 				fdwroutine = NULL;
 		}
diff --git a/src/backend/optimizer/plan/orca.c b/src/backend/optimizer/plan/orca.c
index 97f63f7a334..a083fcda6c7 100644
--- a/src/backend/optimizer/plan/orca.c
+++ b/src/backend/optimizer/plan/orca.c
@@ -405,6 +405,10 @@ optimize_query(Query *parse, int cursorOptions, ParamListInfo boundParams, Optim
 	result->oneoffPlan = glob->oneoffPlan;
 	result->transientPlan = glob->transientPlan;
 
+	result->queryId = parse->queryId;
+	result->stmt_location = parse->stmt_location;
+	result->stmt_len = parse->stmt_len;
+
 	return result;
 }
 
@@ -545,6 +549,10 @@ push_down_expr_mutator(Node *node, List *child_tlist)
 			{
 				((Const *) child_tle->expr)->consttypmod = ((Var *) node)->vartypmod;
 			}
+			else if (IsA(child_tle->expr, Var))
+			{
+				((Var *) child_tle->expr)->vartypmod = ((Var *) node)->vartypmod;
+			}
 
 			return (Node *) child_tle->expr;
 		}
diff --git a/src/backend/optimizer/plan/planner.c b/src/backend/optimizer/plan/planner.c
index afbf249fc33..5f643b6566f 100644
--- a/src/backend/optimizer/plan/planner.c
+++ b/src/backend/optimizer/plan/planner.c
@@ -121,12 +121,7 @@ create_upper_paths_hook_type create_upper_paths_hook = NULL;
 #define EXPRKIND_TABLEFUNC_LATERAL	12
 #define EXPRKIND_WINDOW_BOUND		13
 
-/* Passthrough data for standard_qp_callback */
-typedef struct
-{
-	List	   *activeWindows;	/* active windows, if any */
-	List	   *groupClause;	/* overrides parse->groupClause */
-} standard_qp_extra;
+/* standard_qp_extra is defined in optimizer/planner.h */
 
 /*
  * Data specific to grouping sets
@@ -333,6 +328,27 @@ planner(Query *parse, const char *query_string, int cursorOptions,
 
 	optimizer_options = palloc(sizeof(OptimizerOptions));
 	optimizer_options->create_vectorization_plan = false;
+
+	/*
+	 * Set parallel plan creation based on PostgreSQL planner's parallel safety checks.
+	 * This synchronizes with the same conditions used in standard_planner().
+	 */
+	if ((cursorOptions & CURSOR_OPT_PARALLEL_OK) != 0 &&
+		IsUnderPostmaster &&
+		parse->commandType == CMD_SELECT &&
+		!parse->hasModifyingCTE &&
+		max_parallel_workers_per_gather > 0 &&
+		!IsParallelWorker())
+	{
+		/* All cheap tests pass, check query tree for parallel safety */
+		char maxParallelHazard = max_parallel_hazard(parse);
+		optimizer_options->create_parallel_plan = (maxParallelHazard != PROPARALLEL_UNSAFE);
+	}
+	else
+	{
+		/* Skip the query tree scan, assume unsafe */
+		optimizer_options->create_parallel_plan = false;
+	}
 	if (planner_hook)
 	{
 		if (gp_log_optimization_time)
@@ -953,6 +969,17 @@ subquery_planner(PlannerGlobal *glob, Query *parse,
 	root->partColsUpdated = false;
 	root->is_correlated_subplan = false;
 
+	/*
+	 * Save a copy of the raw parse tree for AQUMV join exact-match.
+	 * This must be done before any preprocessing modifies the parse tree.
+	 */
+	if (Gp_role == GP_ROLE_DISPATCH &&
+		enable_answer_query_using_materialized_views &&
+		parent_root == NULL)
+		root->aqumv_raw_parse = copyObject(parse);
+	else
+		root->aqumv_raw_parse = NULL;
+
 	/*
 	 * If there is a WITH list, process each WITH query and either convert it
 	 * to RTE_SUBQUERY RTE(s) or build an initplan SubPlan structure for it.
@@ -1965,6 +1992,13 @@ grouping_planner(PlannerInfo *root, double tuple_fraction)
 
 			/* Do the real work. */
 			current_rel = answer_query_using_materialized_views(root, aqumv_context);
+
+			/* Try join AQUMV if single-table didn't rewrite. */
+			if (current_rel == aqumv_context->current_rel)
+			{
+				current_rel = answer_query_using_materialized_views_for_join(root, aqumv_context);
+			}
+
 			/* parse tree may be rewriten. */
 			parse = root->parse;
 		}
diff --git a/src/backend/optimizer/util/clauses.c b/src/backend/optimizer/util/clauses.c
index 2669f2c3017..a039fdd87d2 100644
--- a/src/backend/optimizer/util/clauses.c
+++ b/src/backend/optimizer/util/clauses.c
@@ -5522,35 +5522,45 @@ flatten_join_alias_var_optimizer(Query *query, int queryLevel)
 	if (NIL != targetList)
 	{
 		queryNew->targetList = (List *) flatten_join_alias_vars(queryNew, (Node *) targetList);
-		list_free(targetList);
+		if (targetList != queryNew->targetList)
+			list_free(targetList);
 	}
 
-	List * returningList = queryNew->returningList;
+	List *returningList = queryNew->returningList;
 	if (NIL != returningList)
 	{
 		queryNew->returningList = (List *) flatten_join_alias_vars(queryNew, (Node *) returningList);
-		list_free(returningList);
+		if (returningList != queryNew->returningList)
+			list_free(returningList);
 	}
 
 	Node *havingQual = queryNew->havingQual;
 	if (NULL != havingQual)
 	{
 		queryNew->havingQual = flatten_join_alias_vars(queryNew, havingQual);
-		pfree(havingQual);
+		if (havingQual != queryNew->havingQual)
+		{
+			if (IsA(havingQual, List))
+				list_free((List *) havingQual);
+			else
+				pfree(havingQual);
+		}
 	}
 
 	List *scatterClause = queryNew->scatterClause;
 	if (NIL != scatterClause)
 	{
 		queryNew->scatterClause = (List *) flatten_join_alias_vars(queryNew, (Node *) scatterClause);
-		list_free(scatterClause);
+		if (scatterClause != queryNew->scatterClause)
+			list_free(scatterClause);
 	}
 
 	Node *limitOffset = queryNew->limitOffset;
 	if (NULL != limitOffset)
 	{
 		queryNew->limitOffset = flatten_join_alias_vars(queryNew, limitOffset);
-		pfree(limitOffset);
+		if (limitOffset != queryNew->limitOffset)
+			pfree(limitOffset);
 	}
 
 	List *windowClause = queryNew->windowClause;
@@ -5577,7 +5587,8 @@ flatten_join_alias_var_optimizer(Query *query, int queryLevel)
 	if (NULL != limitCount)
 	{
 		queryNew->limitCount = flatten_join_alias_vars(queryNew, limitCount);
-		pfree(limitCount);
+		if (limitCount != queryNew->limitCount)
+			pfree(limitCount);
 	}
 
     return queryNew;
diff --git a/src/backend/optimizer/util/plancat.c b/src/backend/optimizer/util/plancat.c
index 46d85f3c324..5b8123b67fd 100644
--- a/src/backend/optimizer/util/plancat.c
+++ b/src/backend/optimizer/util/plancat.c
@@ -49,6 +49,7 @@
 #include "rewrite/rewriteManip.h"
 #include "statistics/statistics.h"
 #include "storage/bufmgr.h"
+#include "tcop/tcopprot.h"
 #include "utils/builtins.h"
 #include "utils/lsyscache.h"
 #include "utils/partcache.h"
@@ -484,6 +485,17 @@ get_relation_info(PlannerInfo *root, Oid relationObjectId, bool inhparent,
 	/* Grab foreign-table info using the relcache, while we have it */
 	if (relation->rd_rel->relkind == RELKIND_FOREIGN_TABLE)
 	{
+		/* Check if the access to foreign tables is restricted */
+		if (unlikely((restrict_nonsystem_relation_kind & RESTRICT_RELKIND_FOREIGN_TABLE) != 0))
+		{
+			/* there must not be built-in foreign tables */
+			Assert(RelationGetRelid(relation) >= FirstNormalObjectId);
+
+			ereport(ERROR,
+					(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+					 errmsg("access to non-system foreign table is restricted")));
+		}
+
 		rel->serverid = GetForeignServerIdByRelId(RelationGetRelid(relation));
 		rel->segSeverids = GetForeignServerSegsByRelId(RelationGetRelid(relation));
 		rel->fdwroutine = GetFdwRoutineForRelation(relation, true);
@@ -1625,8 +1637,10 @@ GetExtStatisticsName(Oid statOid)
 		elog(ERROR, "cache lookup failed for statistics object %u", statOid);
 
 	staForm = (Form_pg_statistic_ext) GETSTRUCT(htup);
+	/* Copy the name before releasing the cache entry. */
+	char *result = pstrdup(NameStr(staForm->stxname));
 	ReleaseSysCache(htup);
-	return NameStr(staForm->stxname);
+	return result;
 }
 
 /*
diff --git a/src/backend/optimizer/util/walkers.c b/src/backend/optimizer/util/walkers.c
index 3b3d0311d06..be806f4daf7 100644
--- a/src/backend/optimizer/util/walkers.c
+++ b/src/backend/optimizer/util/walkers.c
@@ -8,11 +8,17 @@
 
 #include "postgres.h"
 
+#include "access/htup_details.h"
+#include "catalog/pg_amop.h"
 #include "catalog/pg_collation.h"
 #include "catalog/pg_type.h"
 #include "miscadmin.h"
 #include "nodes/nodeFuncs.h"
+#include "optimizer/optimizer.h"
 #include "optimizer/walkers.h"
+#include "utils/catcache.h"
+#include "utils/lsyscache.h"
+#include "utils/syscache.h"
 
 /**
  * Plan node walker related methods.
@@ -1011,3 +1017,109 @@ check_collation_walker(Node *node, check_collation_context *context)
 	}
 }
 
+/*
+ * is_ordering_op
+ *
+ * Scan the pg_amop entries cached for this operator and report whether at
+ * least one of them is registered with amoppurpose = AMOP_ORDER.
+ */
+static bool
+is_ordering_op(Oid opno)
+{
+	CatCList   *amop_entries;
+	bool		is_ordering = false;
+	int			idx;
+
+	amop_entries = SearchSysCacheList1(AMOPOPID, ObjectIdGetDatum(opno));
+
+	for (idx = 0; idx < amop_entries->n_members && !is_ordering; idx++)
+	{
+		HeapTuple	entry = &amop_entries->members[idx]->tuple;
+		Form_pg_amop amop = (Form_pg_amop) GETSTRUCT(entry);
+
+		is_ordering = (amop->amoppurpose == AMOP_ORDER);
+	}
+
+	ReleaseSysCacheList(amop_entries);
+	return is_ordering;
+}
+
+/*
+ * has_plain_var_arg
+ *
+ * Report whether any argument of the OpExpr is a bare column reference,
+ * i.e. a Var that is not buried inside a function call or other expression.
+ *
+ * Each argument is passed through strip_implicit_coercions() first, so a
+ * column that was implicitly coerced to the operator's input type (for
+ * example a RelabelType for the binary-compatible cast varchar -> text)
+ * still counts as a plain Var.
+ */
+static bool
+has_plain_var_arg(OpExpr *op)
+{
+	bool		saw_var = false;
+	ListCell   *cell;
+
+	foreach(cell, op->args)
+	{
+		saw_var = IsA(strip_implicit_coercions(lfirst(cell)), Var);
+		if (saw_var)
+			break;
+	}
+	return saw_var;
+}
+
+/*
+ * has_orderby_ordering_op
+ *
+ * Check if the query's ORDER BY uses ordering operators (amoppurpose =
+ * AMOP_ORDER in pg_amop) that the PostgreSQL planner can safely optimize
+ * with KNN-GiST index scans but ORCA cannot.
+ *
+ * Returns true only when the sort clause contains at least one ordering
+ * operator and EVERY such operator has at least one direct Var (column
+ * reference) argument.  Expressions like "circle(p,1) <-> point(0,0)" wrap
+ * the column in a function, which can cause "lossy distance functions are
+ * not supported in index-only scans" errors in the planner; in that case
+ * we return false and leave the query for ORCA (Seq Scan + Sort).
+ */
+bool
+has_orderby_ordering_op(Query *query)
+{
+	ListCell   *lc;
+	bool		found_ordering_op = false;
+
+	if (query->sortClause == NIL)
+		return false;
+
+	foreach(lc, query->sortClause)
+	{
+		SortGroupClause *sgc = (SortGroupClause *) lfirst(lc);
+		TargetEntry *tle = get_sortgroupclause_tle(sgc, query->targetList);
+		Node	   *expr = (Node *) tle->expr;
+		OpExpr	   *opexpr;
+
+		if (!IsA(expr, OpExpr))
+			continue;
+
+		opexpr = (OpExpr *) expr;
+		if (!is_ordering_op(opexpr->opno))
+			continue;
+
+		/*
+		 * Found an ordering operator.  Check that at least one argument is
+		 * a plain Var.  If any ordering operator has only computed arguments
+		 * (e.g., function calls wrapping columns), bail out immediately --
+		 * falling back to the planner could produce lossy distance errors
+		 * in index-only scans.
+		 */
+		found_ordering_op = true;
+
+		if (!has_plain_var_arg(opexpr))
+			return false;
+	}
+
+	return found_ordering_op;
+}
+
diff --git a/src/backend/parser/parse_partition_gp.c b/src/backend/parser/parse_partition_gp.c
index 747f1940eac..b912b658376 100644
--- a/src/backend/parser/parse_partition_gp.c
+++ b/src/backend/parser/parse_partition_gp.c
@@ -1687,7 +1687,7 @@ generatePartitions(Oid parentrelid, GpPartitionDefinition *gpPartSpec,
 			if (elem->accessMethod && strcmp(elem->accessMethod, "ao_column") == 0)
 				elem->colencs = merge_partition_encoding(pstate, elem->colencs, penc_cls);
 			else if (!elem->colencs) {
-				/* For the aoco, used `transfromColumnEncodingAocoRootPartition` to
+				/* For the aoco, used `transformColumnEncodingAocoRootPartition` to
 				 * pass encoding clause in root partition. The logic in that method is
 				 * relate to aoco that means it only validate and pass the aoco encoding
 				 * clause options. So we have to give up pass root partition encoding
diff --git a/src/backend/rewrite/rewriteHandler.c b/src/backend/rewrite/rewriteHandler.c
index 23c528b60f9..9da36260c77 100644
--- a/src/backend/rewrite/rewriteHandler.c
+++ b/src/backend/rewrite/rewriteHandler.c
@@ -43,6 +43,7 @@
 #include "rewrite/rewriteManip.h"
 #include "rewrite/rewriteSearchCycle.h"
 #include "rewrite/rowsecurity.h"
+#include "tcop/tcopprot.h"
 #include "utils/builtins.h"
 #include "utils/lsyscache.h"
 #include "utils/rel.h"
@@ -1815,6 +1816,14 @@ ApplyRetrieveRule(Query *parsetree,
 	if (rule->qual != NULL)
 		elog(ERROR, "cannot handle qualified ON SELECT rule");
 
+	/* Check if the expansion of non-system views are restricted */
+	if (unlikely((restrict_nonsystem_relation_kind & RESTRICT_RELKIND_VIEW) != 0 &&
+				 RelationGetRelid(relation) >= FirstNormalObjectId))
+		ereport(ERROR,
+				(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+				 errmsg("access to non-system view \"%s\" is restricted",
+						RelationGetRelationName(relation))));
+
 	if (rt_index == parsetree->resultRelation)
 	{
 		/*
@@ -3261,6 +3270,14 @@ rewriteTargetView(Query *parsetree, Relation view)
 		}
 	}
 
+	/* Check if the expansion of non-system views are restricted */
+	if (unlikely((restrict_nonsystem_relation_kind & RESTRICT_RELKIND_VIEW) != 0 &&
+				 RelationGetRelid(view) >= FirstNormalObjectId))
+		ereport(ERROR,
+				(errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
+				 errmsg("access to non-system view \"%s\" is restricted",
+						RelationGetRelationName(view))));
+
 	/*
 	 * For INSERT/UPDATE the modified columns must all be updatable. Note that
 	 * we get the modified columns from the query's targetlist, not from the
diff --git a/src/backend/storage/freespace/freespace.c b/src/backend/storage/freespace/freespace.c
index 796b915156b..ee97e757115 100644
--- a/src/backend/storage/freespace/freespace.c
+++ b/src/backend/storage/freespace/freespace.c
@@ -633,6 +633,14 @@ fsm_extend(Relation rel, BlockNumber fsm_nblocks)
 		!smgrexists(rel->rd_smgr, FSM_FORKNUM))
 		smgrcreate(rel->rd_smgr, FSM_FORKNUM, false);
 
+	/*
+	 * Might have to re-open if smgrcreate triggered AcceptInvalidationMessages
+	 * (via TablespaceCreateDbspace -> LockSharedObject for non-default
+	 * tablespaces), which may have processed a pending SHAREDINVALSMGR_ID
+	 * message and closed our smgr entry.
+	 */
+	RelationOpenSmgr(rel);
+
 	/* Invalidate cache so that smgrnblocks() asks the kernel. */
 	rel->rd_smgr->smgr_cached_nblocks[FSM_FORKNUM] = InvalidBlockNumber;
 	fsm_nblocks_now = smgrnblocks(rel->rd_smgr, FSM_FORKNUM);
diff --git a/src/backend/tcop/postgres.c b/src/backend/tcop/postgres.c
index 37cdcfba46a..6ae0202b396 100644
--- a/src/backend/tcop/postgres.c
+++ b/src/backend/tcop/postgres.c
@@ -89,6 +89,7 @@
 #include "utils/snapmgr.h"
 #include "utils/timeout.h"
 #include "utils/timestamp.h"
+#include "utils/varlena.h"
 
 #include "cdb/cdbutil.h"
 #include "cdb/cdbvars.h"
@@ -151,6 +152,8 @@ cancel_pending_hook_type cancel_pending_hook = NULL;
  * Hook for query execution.
  */
 exec_simple_query_hook_type exec_simple_query_hook = NULL;
+/* flags for non-system relation kinds to restrict use */
+int			restrict_nonsystem_relation_kind;
 
 /* ----------------
  *		private typedefs etc
@@ -4558,6 +4561,66 @@ assign_max_stack_depth(int newval, void *extra)
 	max_stack_depth_bytes = newval_bytes;
 }
 
+/*
+ * GUC check_hook for restrict_nonsystem_relation_kind: parse the keyword
+ * list in *newval into RESTRICT_RELKIND_* flags, handed over via *extra.
+ */
+bool
+check_restrict_nonsystem_relation_kind(char **newval, void **extra, GucSource source)
+{
+	char	   *rawstring;
+	List	   *elemlist;
+	ListCell   *l;
+	int			flags = 0;
+
+	/* Need a modifiable copy of string */
+	rawstring = pstrdup(*newval);
+
+	if (!SplitIdentifierString(rawstring, ',', &elemlist))
+	{
+		GUC_check_errdetail("List syntax is invalid.");
+		pfree(rawstring);
+		list_free(elemlist);
+		return false;
+	}
+
+	foreach(l, elemlist)
+	{
+		char	   *tok = (char *) lfirst(l);
+
+		if (pg_strcasecmp(tok, "view") == 0)
+			flags |= RESTRICT_RELKIND_VIEW;
+		else if (pg_strcasecmp(tok, "foreign-table") == 0)
+			flags |= RESTRICT_RELKIND_FOREIGN_TABLE;
+		else
+		{
+			GUC_check_errdetail("Unrecognized key word: \"%s\".", tok);
+			pfree(rawstring);
+			list_free(elemlist);
+			return false;
+		}
+	}
+
+	pfree(rawstring);
+	list_free(elemlist);
+
+	/* Save the flags in *extra for the assign hook; fail the check on OOM */
+	*extra = malloc(sizeof(int));
+	if (*extra != NULL)
+		*((int *) *extra) = flags;
+	return (*extra != NULL);
+}
+
+/*
+ * GUC assign_hook for restrict_nonsystem_relation_kind: install the flag
+ * word that the check hook stored in *extra as the active setting.
+ */
+void
+assign_restrict_nonsystem_relation_kind(const char *newval, void *extra)
+{
+	/* extra points at the int bitmask computed by the check hook */
+	restrict_nonsystem_relation_kind = *((int *) extra);
+}
 
 /*
  * set_debug_options --- apply "-d N" command line option
diff --git a/src/backend/tcop/pquery.c b/src/backend/tcop/pquery.c
index 532690f1d51..e5512bb8271 100644
--- a/src/backend/tcop/pquery.c
+++ b/src/backend/tcop/pquery.c
@@ -127,6 +127,9 @@ CreateQueryDesc(PlannedStmt *plannedstmt,
 	if (Gp_role != GP_ROLE_EXECUTE)
 		increment_command_count();
 
+	/* null this field until set by GP Stats Collector */
+	qd->gpsc_query_key = NULL;
+
 	return qd;
 }
 
diff --git a/src/backend/utils/adt/xml.c b/src/backend/utils/adt/xml.c
index 6d38a2d0de2..aafa6203b93 100644
--- a/src/backend/utils/adt/xml.c
+++ b/src/backend/utils/adt/xml.c
@@ -65,6 +65,16 @@
 #if LIBXML_VERSION >= 20704
 #define HAVE_XMLSTRUCTUREDERRORCONTEXT 1
 #endif
+
+/*
+ * libxml2 2.12 decided to insert "const" into the error handler API.
+ */
+#if LIBXML_VERSION >= 21200
+#define PgXmlErrorPtr const xmlError *
+#else
+#define PgXmlErrorPtr xmlErrorPtr
+#endif
+
 #endif							/* USE_LIBXML */
 
 #include "access/htup_details.h"
@@ -121,7 +131,7 @@ struct PgXmlErrorContext
 
 static xmlParserInputPtr xmlPgEntityLoader(const char *URL, const char *ID,
 										   xmlParserCtxtPtr ctxt);
-static void xml_errorHandler(void *data, xmlErrorPtr error);
+static void xml_errorHandler(void *data, PgXmlErrorPtr error);
 static void xml_ereport_by_code(int level, int sqlcode,
 								const char *msg, int errcode);
 static void chopStringInfoNewlines(StringInfo str);
@@ -1762,7 +1772,7 @@ xml_ereport(PgXmlErrorContext *errcxt, int level, int sqlcode, const char *msg)
  * Error handler for libxml errors and warnings
  */
 static void
-xml_errorHandler(void *data, xmlErrorPtr error)
+xml_errorHandler(void *data, PgXmlErrorPtr error)
 {
 	PgXmlErrorContext *xmlerrcxt = (PgXmlErrorContext *) data;
 	xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) error->ctxt;
diff --git a/src/backend/utils/init/miscinit.c b/src/backend/utils/init/miscinit.c
index a8e7ff0f057..83dee55ad8a 100644
--- a/src/backend/utils/init/miscinit.c
+++ b/src/backend/utils/init/miscinit.c
@@ -841,6 +841,14 @@ InitializeSessionUserIdStandalone(void)
 	AuthenticatedUserIsSuperuser = true;
 
 	SetSessionUserId(BOOTSTRAP_SUPERUSERID, true);
+
+	/*
+	 * XXX This should set SetConfigOption("session_authorization"), too.
+	 * Since we don't, C code will get NULL, and current_setting() will get an
+	 * empty string.
+	 */
+	SetConfigOption("is_superuser", "on",
+					PGC_INTERNAL, PGC_S_DYNAMIC_DEFAULT);
 }
 
 
diff --git a/src/backend/utils/misc/guc.c b/src/backend/utils/misc/guc.c
index 168f6113ce2..bc3e76d0314 100644
--- a/src/backend/utils/misc/guc.c
+++ b/src/backend/utils/misc/guc.c
@@ -686,6 +686,8 @@ static char *recovery_target_xid_string;
 static char *recovery_target_name_string;
 static char *recovery_target_lsn_string;
 static char *file_encryption_method_str;
+static char *restrict_nonsystem_relation_kind_string;
+
 
 /* should be static, but commands/variable.c needs to get at this */
 char	   *role_string;
@@ -4761,7 +4763,18 @@ static struct config_string ConfigureNamesString[] =
 		"",
 		NULL, NULL, NULL
 	},
-	
+
+	{
+		{"restrict_nonsystem_relation_kind", PGC_USERSET, CLIENT_CONN_STATEMENT,
+			gettext_noop("Sets relation kinds of non-system relation to restrict use"),
+			NULL,
+			GUC_LIST_INPUT | GUC_NOT_IN_SAMPLE
+		},
+		&restrict_nonsystem_relation_kind_string,
+		"",
+		check_restrict_nonsystem_relation_kind, assign_restrict_nonsystem_relation_kind, NULL
+	},
+
 	/* End-of-list marker */
 	{
 		{NULL, 0, 0, NULL, NULL}, NULL, NULL, NULL, NULL, NULL
diff --git a/src/backend/utils/misc/guc_gp.c b/src/backend/utils/misc/guc_gp.c
index 42b61dfbbbb..7a4433cfa98 100644
--- a/src/backend/utils/misc/guc_gp.c
+++ b/src/backend/utils/misc/guc_gp.c
@@ -154,6 +154,7 @@ bool		enable_parallel_dedup_semi_join = true;
 bool		enable_parallel_dedup_semi_reverse_join = true;
 bool		parallel_query_use_streaming_hashagg = false;
 bool		gp_use_streaming_hashagg = true;
+bool		optimizer_use_streaming_hashagg = true;
 int			gp_appendonly_insert_files = 0;
 int			gp_appendonly_insert_files_tuples_range = 0;
 int			gp_random_insert_segments = 0;
@@ -1909,6 +1910,16 @@ struct config_bool ConfigureNamesBool_gp[] =
 		true, NULL, NULL
 	},
 
+	{
+		{"optimizer_use_streaming_hashagg", PGC_USERSET, DEVELOPER_OPTIONS,
+			gettext_noop("Use streaming hash agg in ORCA-generated local partial hash aggregations."),
+			NULL,
+			GUC_NO_SHOW_ALL | GUC_NOT_IN_SAMPLE
+		},
+		&optimizer_use_streaming_hashagg,
+		true, NULL, NULL
+	},
+
 	{
 		{"gp_force_random_redistribution", PGC_USERSET, CUSTOM_OPTIONS,
 			gettext_noop("Force redistribution of insert for randomly-distributed."),
@@ -4936,7 +4947,7 @@ struct config_string ConfigureNamesString_gp[] =
 	{
 		{"gp_resource_manager", PGC_POSTMASTER, RESOURCES,
 			gettext_noop("Sets the type of resource manager."),
-			gettext_noop("Only support \"queue\" and \"group\" for now.")
+			gettext_noop("Only support \"queue\", \"group\" and \"group-v2\" for now.")
 		},
 		&gp_resource_manager_str,
 		"queue",
diff --git a/src/backend/utils/resgroup/resgroup.c b/src/backend/utils/resgroup/resgroup.c
index e474e106490..88f9acea9a0 100644
--- a/src/backend/utils/resgroup/resgroup.c
+++ b/src/backend/utils/resgroup/resgroup.c
@@ -3700,7 +3700,6 @@ check_and_unassign_from_resgroup(PlannedStmt* stmt)
 	} while (!groupIncBypassedRef(&groupInfo));
 
 	bypassedGroup = groupInfo.group;
-	bypassedGroup->totalExecuted++;
 	pgstat_report_resgroup(bypassedGroup->groupId);
 	bypassedSlot.group = groupInfo.group;
 	bypassedSlot.groupId = groupInfo.groupId;
diff --git a/src/backend/utils/workfile_manager/workfile_mgr.c b/src/backend/utils/workfile_manager/workfile_mgr.c
index e5b311cf9ba..21b4463e5f1 100644
--- a/src/backend/utils/workfile_manager/workfile_mgr.c
+++ b/src/backend/utils/workfile_manager/workfile_mgr.c
@@ -192,6 +192,9 @@ static void unpin_workset(workfile_set *work_set);
 
 static bool proc_exit_hook_registered = false;
 
+static uint64 total_bytes_written = 0;
+static uint64 total_files_created = 0;
+
 Datum gp_workfile_mgr_cache_entries(PG_FUNCTION_ARGS);
 Datum gp_workfile_mgr_used_diskspace(PG_FUNCTION_ARGS);
 
@@ -371,6 +374,7 @@ RegisterFileWithSet(File file, workfile_set *work_set)
 	localCtl.entries[file].work_set = work_set;
 	work_set->num_files++;
 	work_set->perquery->num_files++;
+	total_files_created++;
 
 	/* Enforce the limit on number of files */
 	if (gp_workfile_limit_files_per_query > 0 &&
@@ -447,6 +451,7 @@ UpdateWorkFileSize(File file, uint64 newsize)
 					(errcode(ERRCODE_INSUFFICIENT_RESOURCES),
 					 errmsg("workfile per segment size limit exceeded")));
 		}
+		total_bytes_written += diff;
 	}
 
 	/*
@@ -986,3 +991,22 @@ workfile_is_active(workfile_set *workfile)
 {
 	return workfile ? workfile->active : false;
 }
+
+uint64
+WorkfileTotalBytesWritten(void)
+{
+	return total_bytes_written; /* current value of the file-static byte tally */
+}
+
+uint64
+WorkfileTotalFilesCreated(void)
+{
+	return total_files_created; /* current value of the file-static file tally */
+}
+
+void
+WorkfileResetBackendStats(void)
+{
+	total_bytes_written = 0;	/* restart the bytes-written tally */
+	total_files_created = 0;	/* restart the files-created tally */
+}
diff --git a/src/bin/initdb/initdb.c b/src/bin/initdb/initdb.c
index f7c34a3e208..8fdae656bc8 100644
--- a/src/bin/initdb/initdb.c
+++ b/src/bin/initdb/initdb.c
@@ -175,6 +175,8 @@ static char *external_fts_files;
 #endif
 static char *system_functions_file;
 static char *system_views_file;
+static char *system_views_gp_file;
+static char *system_views_gp_summary_file;
 static bool success = false;
 static bool made_new_pgdata = false;
 static bool found_existing_pgdata = false;
@@ -1705,8 +1707,6 @@ setup_run_file(FILE *cmdfd, const char *filename)
 	}
 
 	PG_CMD_PUTS("\n\n");
-
-	free(lines);
 }
 
 /*
@@ -2024,7 +2024,7 @@ setup_cdb_schema(FILE *cmdfd)
 
 	/* Collect all files with .sql suffix in array. */
 	nscripts = 0;
-	while ((file = readdir(dir)) != NULL)
+	while (errno = 0, (file = readdir(dir)) != NULL)
 	{
 		int			namelen = strlen(file->d_name);
 
@@ -2054,12 +2054,16 @@ setup_cdb_schema(FILE *cmdfd)
 		errno = 0;
 #endif
 
-	closedir(dir);
-
 	if (errno != 0)
 	{
-		/* some kind of I/O error? */
 		pg_log_error("error while reading cdb_init.d directory: %m");
+		closedir(dir);
+		exit(1);
+	}
+
+	if (closedir(dir))
+	{
+		pg_log_error("error while closing cdb_init.d directory: %m");
 		exit(1);
 	}
 
@@ -2833,6 +2837,8 @@ setup_data_file_paths(void)
 	set_input(&system_constraints_file, "system_constraints.sql");
 	set_input(&system_functions_file, "system_functions.sql");
 	set_input(&system_views_file, "system_views.sql");
+	set_input(&system_views_gp_file, "system_views_gp.sql");
+	set_input(&system_views_gp_summary_file, "system_views_gp_summary.sql");
 
 	set_input(&cdb_init_d_dir, "cdb_init.d");
 
@@ -2866,6 +2872,8 @@ setup_data_file_paths(void)
 #endif
 	check_input(system_functions_file);
 	check_input(system_views_file);
+	check_input(system_views_gp_file);
+	check_input(system_views_gp_summary_file);
 }
 
 
@@ -3233,6 +3241,8 @@ initialize_data_directory(void)
 	 */
 
 	setup_run_file(cmdfd, system_views_file);
+	setup_run_file(cmdfd, system_views_gp_file);
+	setup_run_file(cmdfd, system_views_gp_summary_file);
 
 	setup_description(cmdfd);
 
diff --git a/src/bin/pg_dump/pg_dump.c b/src/bin/pg_dump/pg_dump.c
index a484f693b43..f1c2644bfdd 100644
--- a/src/bin/pg_dump/pg_dump.c
+++ b/src/bin/pg_dump/pg_dump.c
@@ -362,6 +362,7 @@ static void appendReloptionsArrayAH(PQExpBuffer buffer, const char *reloptions,
 									const char *prefix, Archive *fout);
 static char *get_synchronized_snapshot(Archive *fout);
 static void setupDumpWorker(Archive *AHX);
+static void set_restrict_relation_kind(Archive *AH, const char *value);
 static TableInfo *getRootTableInfo(const TableInfo *tbinfo);
 static bool forcePartitionRootLoad(const TableInfo *tbinfo);
 
@@ -384,17 +385,17 @@ static char *nextToken(register char **stringp, register const char *delim);
 static void addDistributedBy(Archive *fout, PQExpBuffer q, const TableInfo *tbinfo, int actual_atts);
 static void addDistributedByOld(Archive *fout, PQExpBuffer q, const TableInfo *tbinfo, int actual_atts);
 static void addSchedule(Archive *fout, PQExpBuffer q, const TableInfo *tbinfo);
-static bool isGPDB(Archive *fout);
+static bool isMPP(Archive *fout);
 static bool isGPDB5000OrLater(Archive *fout);
 static bool isGPDB6000OrLater(Archive *fout);
 
 /* END MPP ADDITION */
 
 /*
- * Check if we are talking to GPDB
+ * Check if we are talking to Greenplum or Cloudberry
  */
 static bool
-isGPDB(Archive *fout)
+isMPP(Archive *fout)
 {
 	static int	value = -1;		/* -1 = not known yet, 0 = no, 1 = yes */
 
@@ -408,7 +409,7 @@ isGPDB(Archive *fout)
 		res = ExecuteSqlQuery(fout, query, PGRES_TUPLES_OK);
 
 		ver = (PQgetvalue(res, 0, 0));
-		if (strstr(ver, "Cloudberry") != NULL)
+		if (strstr(ver, "Cloudberry") != NULL || strstr(ver, "Greenplum") != NULL)
 			value = 1;
 		else
 			value = 0;
@@ -422,8 +423,8 @@ isGPDB(Archive *fout)
 static bool
 isGPDB5000OrLater(Archive *fout)
 {
-	if (!isGPDB(fout))
-		return false;		/* Not Cloudberry at all. */
+	if (!isMPP(fout))
+		return false;		/* Not GP-based at all. */
 
 	/* GPDB 5 is based on PostgreSQL 8.3 */
 	return fout->remoteVersion >= 80300;
@@ -433,8 +434,8 @@ isGPDB5000OrLater(Archive *fout)
 static bool
 isGPDB6000OrLater(Archive *fout)
 {
-	if (!isGPDB(fout))
-		return false;		/* Not Cloudberry at all. */
+	if (!isMPP(fout))
+		return false;		/* Not GP-based at all. */
 
 	/* GPDB 6 is based on PostgreSQL 9.4 */
 	return fout->remoteVersion >= 90400;
@@ -1468,6 +1469,13 @@ setup_connection(Archive *AH, const char *dumpencoding,
 			ExecuteSqlStatement(AH, "SET row_security = off");
 	}
 
+	/*
+	 * For security reasons, we restrict the expansion of non-system views and
+	 * access to foreign tables during the pg_dump process. This restriction
+	 * is adjusted when dumping foreign table data.
+	 */
+	set_restrict_relation_kind(AH, "view, foreign-table");
+
 	/*
 	 * Start transaction-snapshot mode transaction to dump consistent data.
 	 */
@@ -2362,6 +2370,11 @@ dumpTableData_copy(Archive *fout, const void *dcontext)
 	 */
 	if (tdinfo->filtercond || tbinfo->relkind == RELKIND_FOREIGN_TABLE)
 	{
+		/* Temporary allows to access to foreign tables to dump data */
+		if (tbinfo->relkind == RELKIND_FOREIGN_TABLE)
+			set_restrict_relation_kind(fout, "view");
+
+		/* Note: this syntax is only supported in 8.2 and up */
 		appendPQExpBufferStr(q, "COPY (SELECT ");
 		/* klugery to get rid of parens in column list */
 		if (strlen(column_list) > 2)
@@ -2473,6 +2486,11 @@ dumpTableData_copy(Archive *fout, const void *dcontext)
 					   classname);
 
 	destroyPQExpBuffer(q);
+
+	/* Revert back the setting */
+	if (tbinfo->relkind == RELKIND_FOREIGN_TABLE)
+		set_restrict_relation_kind(fout, "view, foreign-table");
+
 	return 1;
 }
 
@@ -2499,6 +2517,10 @@ dumpTableData_insert(Archive *fout, const void *dcontext)
 	int			rows_per_statement = dopt->dump_inserts;
 	int			rows_this_statement = 0;
 
+	/* Temporary allows to access to foreign tables to dump data */
+	if (tbinfo->relkind == RELKIND_FOREIGN_TABLE)
+		set_restrict_relation_kind(fout, "view");
+
 	/*
 	 * If we're going to emit INSERTs with column names, the most efficient
 	 * way to deal with generated columns is to exclude them entirely.  For
@@ -2738,6 +2760,10 @@ dumpTableData_insert(Archive *fout, const void *dcontext)
 		destroyPQExpBuffer(insertStmt);
 	free(attgenerated);
 
+	/* Revert back the setting */
+	if (tbinfo->relkind == RELKIND_FOREIGN_TABLE)
+		set_restrict_relation_kind(fout, "view, foreign-table");
+
 	return 1;
 }
 
@@ -4819,6 +4845,28 @@ is_superuser(Archive *fout)
 	return false;
 }
 
+/*
+ * Apply "value" to restrict_nonsystem_relation_kind through set_config()
+ * (is_local = false).  The call is driven from a query over pg_settings, so
+ * on a server without that parameter it matches no row and changes nothing.
+ */
+static void
+set_restrict_relation_kind(Archive *AH, const char *value)
+{
+	PQExpBuffer sql;
+
+	sql = createPQExpBuffer();
+	appendPQExpBuffer(sql,
+					  "SELECT set_config(name, '%s', false) "
+					  "FROM pg_settings "
+					  "WHERE name = 'restrict_nonsystem_relation_kind'",
+					  value);
+
+	/* Only the side effect matters; discard the result set right away. */
+	PQclear(ExecuteSqlQuery(AH, sql->data, PGRES_TUPLES_OK));
+	destroyPQExpBuffer(sql);
+}
+
 /*
  * getSubscriptions
  *	  get information about subscriptions
diff --git a/src/bin/psql/describe.c b/src/bin/psql/describe.c
index 90c8bb777fa..7423459e690 100644
--- a/src/bin/psql/describe.c
+++ b/src/bin/psql/describe.c
@@ -52,7 +52,7 @@ static bool describeOneTSConfig(const char *oid, const char *nspname,
 static void printACLColumn(PQExpBuffer buf, const char *colname);
 static bool listOneExtensionContents(const char *extname, const char *oid);
 
-static bool isGPDB(void);
+static bool isMPP(void);
 static bool isGPDB4200OrLater(void);
 static bool isGPDB5000OrLater(void);
 static bool isGPDB6000OrLater(void);
@@ -64,7 +64,7 @@ static bool validateSQLNamePattern(PQExpBuffer buf, const char *pattern,
 								   const char *visibilityrule,
 								   bool *added_clause, int maxparts);
 
-static bool isGPDB(void)
+static bool isMPP(void)
 {
 	static enum
 	{
@@ -86,7 +86,7 @@ static bool isGPDB(void)
 		return false;
 
 	ver = PQgetvalue(res, 0, 0);
-	if (strstr(ver, "Cloudberry") != NULL)
+	if (strstr(ver, "Cloudberry") != NULL || strstr(ver, "Greenplum") != NULL)
 	{
 		PQclear(res);
 		talking_to_gpdb = gpdb_yes;
@@ -113,7 +113,7 @@ static bool isGPDB4200OrLater(void)
 {
 	bool       retValue = false;
 
-	if (isGPDB() == true)
+	if (isMPP() == true)
 	{
 		PGresult  *result;
 
@@ -134,7 +134,7 @@ isGPDB4300OrLater(void)
 {
 	bool       retValue = false;
 
-	if (isGPDB() == true)
+	if (isMPP() == true)
 	{
 		PGresult  *result;
 
@@ -157,7 +157,7 @@ static bool isGPDB5000OrLater(void)
 {
 	bool	retValue = false;
 
-	if (isGPDB() == true)
+	if (isMPP() == true)
 	{
 		PGresult   *res;
 
@@ -171,8 +171,8 @@ static bool isGPDB5000OrLater(void)
 static bool
 isGPDB6000OrLater(void)
 {
-	if (!isGPDB())
-		return false;		/* Not Cloudberry at all. */
+	if (!isMPP())
+		return false;		/* Not GP-based at all. */
 
 	/* GPDB 6 is based on PostgreSQL 9.4 */
 	return pset.sversion >= 90400;
@@ -181,8 +181,8 @@ isGPDB6000OrLater(void)
 static bool
 isGPDB6000OrBelow(void)
 {
-	if (!isGPDB())
-		return false;		/* Not Cloudberry at all. */
+	if (!isMPP())
+		return false;		/* Not GP-based at all. */
 
 	/* GPDB 6 is based on PostgreSQL 9.4 */
 	return pset.sversion <= 90400;
@@ -191,8 +191,8 @@ isGPDB6000OrBelow(void)
 static bool
 isGPDB7000OrLater(void)
 {
-	if (!isGPDB())
-		return false;		/* Not Cloudberry at all. */
+	if (!isMPP())
+		return false;		/* Not GP-based at all. */
 
 	/* GPDB 7 is based on PostgreSQL v12 */
 	return pset.sversion >= 120000;
@@ -2007,7 +2007,7 @@ describeOneTableDetails(const char *schemaname,
 						   "array(select 'toast.' || x from pg_catalog.unnest(tc.reloptions) x), ', ')\n"
 						   : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "c.relstorage" : "'h'"),
+						  (isMPP() ? "c.relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 90400)
@@ -2027,7 +2027,7 @@ describeOneTableDetails(const char *schemaname,
 						   "array(select 'toast.' || x from pg_catalog.unnest(tc.reloptions) x), ', ')\n"
 						   : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "c.relstorage" : "'h'"),
+						  (isMPP() ? "c.relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 90100)
@@ -2047,7 +2047,7 @@ describeOneTableDetails(const char *schemaname,
 						   "array(select 'toast.' || x from pg_catalog.unnest(tc.reloptions) x), ', ')\n"
 						   : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "c.relstorage" : "'h'"),
+						  (isMPP() ? "c.relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 90000)
@@ -2066,7 +2066,7 @@ describeOneTableDetails(const char *schemaname,
 						   "array(select 'toast.' || x from pg_catalog.unnest(tc.reloptions) x), ', ')\n"
 						   : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "c.relstorage" : "'h'"),
+						  (isMPP() ? "c.relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 80400)
@@ -2084,7 +2084,7 @@ describeOneTableDetails(const char *schemaname,
 						   "array(select 'toast.' || x from pg_catalog.unnest(tc.reloptions) x), ', ')\n"
 						   : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "c.relstorage" : "'h'"),
+						  (isMPP() ? "c.relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 80200)
@@ -2098,7 +2098,7 @@ describeOneTableDetails(const char *schemaname,
 						  (verbose ?
 						   "pg_catalog.array_to_string(reloptions, E', ')" : "''"),
 						  /* GPDB Only:  relstorage  */
-						  (isGPDB() ? "relstorage" : "'h'"),
+						  (isMPP() ? "relstorage" : "'h'"),
 						  oid);
 	}
 	else if (pset.sversion >= 80000)
@@ -2161,7 +2161,7 @@ describeOneTableDetails(const char *schemaname,
 	tableinfo.isdynamic = strcmp(PQgetvalue(res, 0, 16), "t") == 0;
 
 	/* GPDB Only:  relstorage  */
-	if (pset.sversion < 120000 && isGPDB())
+	if (pset.sversion < 120000 && isMPP())
 		tableinfo.relstorage = *(PQgetvalue(res, 0, PQfnumber(res, "relstorage")));
 	else
 		tableinfo.relstorage = 'h';
@@ -3840,7 +3840,7 @@ describeOneTableDetails(const char *schemaname,
 							 * listing them.
 							 */
 							tgdef = PQgetvalue(result, i, 1);
-							if (isGPDB() && strstr(tgdef, "RI_FKey_") != NULL)
+							if (isMPP() && strstr(tgdef, "RI_FKey_") != NULL)
 								list_trigger = false;
 
 							break;
@@ -5145,7 +5145,7 @@ listTables(const char *tabtypes, const char *pattern, bool verbose, bool showSys
 	cols_so_far = 4;
 
 	/* Show Storage type for tables */
-	if (showTables && isGPDB())
+	if (showTables && isMPP())
 	{
 		if (isGPDB7000OrLater())
 		{
diff --git a/src/bin/psql/tab-complete.c b/src/bin/psql/tab-complete.c
index dc401f503b1..905ad740555 100644
--- a/src/bin/psql/tab-complete.c
+++ b/src/bin/psql/tab-complete.c
@@ -1614,6 +1614,12 @@ psql_completion(const char *text, int start, int end)
 		NULL
 	};
 
+	static const char *const list_resource_group_type[] = {
+		"CONCURRENCY", "CPU_MAX_PERCENT", "CPUSET", "CPU_WEIGHT",
+		"MEMORY_QUOTA", "MIN_COST", "IO_LIMIT",
+		NULL
+	};
+
 	/*
 	 * Temporary workaround for a bug in recent (2019) libedit: it incorrectly
 	 * de-escapes the input "text", causing us to fail to recognize backslash
@@ -3115,8 +3121,8 @@ psql_completion(const char *text, int start, int end)
 	else if (Matches("CREATE", "ROLE|USER|GROUP", MatchAny, "IN"))
 		COMPLETE_WITH("GROUP", "ROLE");
 
-/* CREATE/DROP RESOURCE GROUP/QUEUE */
-	else if (Matches("CREATE|DROP", "RESOURCE"))
+/* CREATE/DROP/ALTER RESOURCE GROUP/QUEUE */
+	else if (Matches("CREATE|DROP|ALTER", "RESOURCE"))
 	 {
 		static const char *const list_CREATERESOURCEGROUP[] =
 		{"GROUP", "QUEUE", NULL};
@@ -3130,19 +3136,19 @@ psql_completion(const char *text, int start, int end)
 	else if (Matches("CREATE", "PROFILE", MatchAny, "LIMIT"))
 		COMPLETE_WITH("FAILED_LOGIN_ATTEMPTS", "PASSWORD_REUSE_MAX", "PASSWORD_LOCK_TIME");
 
-	/* CREATE/DROP RESOURCE GROUP */
-	else if (TailMatches("CREATE|DROP", "RESOURCE", "GROUP"))
+	/* CREATE/DROP/ALTER RESOURCE GROUP */
+	else if (TailMatches("CREATE|DROP|ALTER", "RESOURCE", "GROUP"))
 		COMPLETE_WITH_QUERY(Query_for_list_of_resgroups);
 	/* CREATE RESOURCE GROUP <name> */
 	else if (TailMatches("CREATE|DROP", "RESOURCE", "GROUP", MatchAny))
 		COMPLETE_WITH("WITH (");
+	/* ALTER RESOURCE GROUP <name> */
+	else if (TailMatches("ALTER", "RESOURCE", "GROUP", MatchAny))
+		COMPLETE_WITH("SET");
+	else if (TailMatches("ALTER", "RESOURCE", "GROUP", MatchAny, "SET"))
+		COMPLETE_WITH_LIST(list_resource_group_type);
 	else if (TailMatches("RESOURCE", "GROUP", MatchAny, "WITH", "("))
-	{
-		static const char *const list_CREATERESOURCEGROUP[] =
-		{"CONCURRENCY", "CPU_MAX_PERCENT", "CPUSET", "CPU_WEIGHT", "MEMORY_QUOTA", "MIN_COST", "IO_LIMIT", NULL};
-
-		COMPLETE_WITH_LIST(list_CREATERESOURCEGROUP);
-	}
+		COMPLETE_WITH_LIST(list_resource_group_type);
 
 /* CREATE TYPE */
 	else if (Matches("CREATE", "TYPE", MatchAny))
diff --git a/src/include/access/external.h b/src/include/access/external.h
index 35933f54f75..453c3d59179 100644
--- a/src/include/access/external.h
+++ b/src/include/access/external.h
@@ -48,5 +48,10 @@ extern ExtTableEntry *GetExtFromForeignTableOptions(List *ftoptons, Oid relid);
 
 extern ExternalScanInfo *MakeExternalScanInfo(ExtTableEntry *extEntry);
 
+/*
+ * Parse an "encoding" FDW OPTIONS value (symbolic name or numeric string)
+ * into a numeric encoding ID. ereports on invalid input.
+ */
+extern int parse_fdw_encoding_option(const char *value);
 
 #endif   /* EXTERNAL_H */
diff --git a/src/include/access/reloptions.h b/src/include/access/reloptions.h
index 3b411103c19..74bc6fae99a 100644
--- a/src/include/access/reloptions.h
+++ b/src/include/access/reloptions.h
@@ -306,7 +306,7 @@ extern List *transformColumnEncoding(const TableAmRoutine *tam, Relation rel, Li
 										List *stenc, List *withOptions, List *parentenc,
 										bool explicitOnly, bool createDefaultOne, bool appendonly);
 
-List* transfromColumnEncodingAocoRootPartition(List *colDefs, List *stenc, List *withOptions, bool errorOnEncodingClause);
+List* transformColumnEncodingAocoRootPartition(List *colDefs, List *stenc, List *withOptions, bool errorOnEncodingClause);
 
 extern List *transformStorageEncodingClause(List *options, bool validate);
 extern List *form_default_storage_directive(List *enc);
diff --git a/src/include/catalog/catversion.h b/src/include/catalog/catversion.h
index 86910a0dada..ac649996d98 100644
--- a/src/include/catalog/catversion.h
+++ b/src/include/catalog/catversion.h
@@ -56,6 +56,6 @@
  */
 
 /*							3yyymmddN */
-#define CATALOG_VERSION_NO	302502091
+#define CATALOG_VERSION_NO	302509031
 
 #endif
diff --git a/src/include/cdb/cdbinterconnect.h b/src/include/cdb/cdbinterconnect.h
index 5204d4c1b94..c6c64de9590 100644
--- a/src/include/cdb/cdbinterconnect.h
+++ b/src/include/cdb/cdbinterconnect.h
@@ -154,13 +154,13 @@ typedef struct MotionLayerState
 	/*
 	 * GLOBAL MOTION-LAYER STATISTICS
 	 */
-	uint32		stat_total_chunks_sent; /* Tuple-chunks sent. */
-	uint32		stat_total_bytes_sent;	/* Bytes sent, including headers. */
-	uint32		stat_tuple_bytes_sent;	/* Bytes of pure tuple-data sent. */
+	uint64		stat_total_chunks_sent; /* Tuple-chunks sent. */
+	uint64		stat_total_bytes_sent;	/* Bytes sent, including headers. */
+	uint64		stat_tuple_bytes_sent;	/* Bytes of pure tuple-data sent. */
 
-	uint32		stat_total_chunks_recvd;/* Tuple-chunks received. */
-	uint32		stat_total_bytes_recvd; /* Bytes received, including headers. */
-	uint32		stat_tuple_bytes_recvd; /* Bytes of pure tuple-data received. */
+	uint64		stat_total_chunks_recvd;/* Tuple-chunks received. */
+	uint64		stat_total_bytes_recvd; /* Bytes received, including headers. */
+	uint64		stat_tuple_bytes_recvd; /* Bytes of pure tuple-data received. */
 
 	uint32		stat_total_chunkproc_calls;		/* Calls to processIncomingChunks() */
 
diff --git a/src/include/cdb/cdbpathlocus.h b/src/include/cdb/cdbpathlocus.h
index 0f71ba55dfb..9f5a8227e68 100644
--- a/src/include/cdb/cdbpathlocus.h
+++ b/src/include/cdb/cdbpathlocus.h
@@ -292,13 +292,13 @@ typedef struct CdbPathLocus
 		_locus->parallel_workers = (parallel_workers_); \
         Assert(cdbpathlocus_is_valid(*_locus));         \
     } while (0)
-#define CdbPathLocus_MakeHashedOJ(plocus, distkey_, numsegments_)     \
+#define CdbPathLocus_MakeHashedOJ(plocus, distkey_, numsegments_, parallel_workers_)     \
     do {                                                \
         CdbPathLocus *_locus = (plocus);                \
         _locus->locustype = CdbLocusType_HashedOJ;		\
         _locus->numsegments = (numsegments_);           \
         _locus->distkey = (distkey_);					\
-        _locus->parallel_workers = 0;                   \
+		_locus->parallel_workers = (parallel_workers_); \
         Assert(cdbpathlocus_is_valid(*_locus));         \
     } while (0)
 #define CdbPathLocus_MakeHashedWorkers(plocus, distkey_, numsegments_, parallel_workers_)      \
diff --git a/src/include/executor/execdesc.h b/src/include/executor/execdesc.h
index e3ecf31b664..d50d3e48f6b 100644
--- a/src/include/executor/execdesc.h
+++ b/src/include/executor/execdesc.h
@@ -22,6 +22,14 @@
 
 struct CdbExplain_ShowStatCtx;  /* private, in "cdb/cdbexplain.c" */
 
+typedef struct GpscQueryKey	/* per-query key for GP Stats Collector; QueryDesc holds a pointer to one */
+{
+	int tmid; /* transaction time */
+	int ssid; /* session id */
+	int ccnt; /* command count */
+	int nesting_level; /* NOTE(review): presumably the query's nesting depth -- confirm */
+	uintptr_t query_desc_addr; /* NOTE(review): presumably the owning QueryDesc's address -- confirm */
+} GpscQueryKey;
 
 /*
  * SerializedParams is used to serialize external query parameters
@@ -330,6 +338,9 @@ typedef struct QueryDesc
 
 	/* This is always set NULL by the core system, but plugins can change it */
 	struct Instrumentation *totaltime;	/* total time spent in ExecutorRun */
+
+	/* GP Stats Collector: key identifying this query (see GpscQueryKey) */
+	GpscQueryKey *gpsc_query_key;
 } QueryDesc;
 
 /* in pquery.c */
diff --git a/src/include/executor/hashjoin.h b/src/include/executor/hashjoin.h
index e324e67d914..9e243c47847 100644
--- a/src/include/executor/hashjoin.h
+++ b/src/include/executor/hashjoin.h
@@ -195,6 +195,7 @@ typedef struct ParallelHashJoinBatch
 	size_t		ntuples;		/* number of tuples loaded */
 	size_t		old_ntuples;	/* number of tuples before repartitioning */
 	bool		space_exhausted;
+	bool		skip_unmatched; /* whether to abandon unmatched scan */
 
 	/*
 	 * Variable-sized SharedTuplestore objects follow this struct in memory.
@@ -239,7 +240,7 @@ typedef struct ParallelHashJoinBatchAccessor
 	size_t		estimated_size; /* size of partition on disk */
 	size_t		old_ntuples;	/* how many tuples before repartitioning? */
 	bool		at_least_one_chunk; /* has this backend allocated a chunk? */
-
+	bool		outer_eof;		/* has this process hit end of batch? */
 	bool		done;			/* flag to remember that a batch is done */
 	SharedTuplestoreAccessor *inner_tuples;
 	SharedTuplestoreAccessor *outer_tuples;
@@ -306,7 +307,8 @@ typedef struct ParallelHashJoinState
 #define PHJ_BATCH_ALLOCATING			1
 #define PHJ_BATCH_LOADING				2
 #define PHJ_BATCH_PROBING				3
-#define PHJ_BATCH_DONE					4
+#define PHJ_BATCH_SCAN					4
+#define PHJ_BATCH_FREE					5
 
 /* The phases of batch growth while hashing, for grow_batches_barrier. */
 #define PHJ_GROW_BATCHES_ELECTING		0
diff --git a/src/include/executor/nodeHash.h b/src/include/executor/nodeHash.h
index 993de4519b5..36549376ef9 100644
--- a/src/include/executor/nodeHash.h
+++ b/src/include/executor/nodeHash.h
@@ -64,9 +64,12 @@ extern bool ExecScanHashBucket(HashState *hashState, HashJoinState *hjstate,
 extern bool ExecParallelScanHashBucket(HashState *hashState, HashJoinState *hjstate,
 									   ExprContext *econtext);
 extern void ExecPrepHashTableForUnmatched(HashJoinState *hjstate);
+extern bool ExecParallelPrepHashTableForUnmatched(HashJoinState *hjstate);
 extern bool ExecScanHashTableForUnmatched(HashJoinState *hjstate,
 										  ExprContext *econtext);
 extern void ExecHashTableReset(HashState *hashState, HashJoinTable hashtable);
+extern bool ExecParallelScanHashTableForUnmatched(HashJoinState *hjstate,
+												  ExprContext *econtext);
 extern void ExecHashTableResetMatchFlags(HashJoinTable hashtable);
 extern void ExecChooseHashTableSize(double ntuples, int tupwidth, bool useskew,
                                     uint64 operatorMemKB,
diff --git a/src/include/gpopt/gpdbwrappers.h b/src/include/gpopt/gpdbwrappers.h
index 261cd28b5f0..01d7eaa8cce 100644
--- a/src/include/gpopt/gpdbwrappers.h
+++ b/src/include/gpopt/gpdbwrappers.h
@@ -673,6 +673,9 @@ int FindNodes(Node *node, List *nodeTags);
 // look for nodes with non-default collation; returns 1 if any exist, -1 otherwise
 int CheckCollation(Node *node);
 
+// check if ORDER BY uses an ordering operator (amcanorderbyop) unsupported by ORCA
+bool HasOrderByOrderingOp(Query *query);
+
 Node *CoerceToCommonType(ParseState *pstate, Node *node, Oid target_type,
 						 const char *context);
 
@@ -717,6 +720,9 @@ List *GetMergeJoinOpFamilies(Oid opno);
 // get the OID of base elementtype fora given typid
 Oid GetBaseType(Oid typid);
 
+// check if parallel mode is OK (comprehensive check)
+bool IsParallelModeOK(void);
+
 // returns the result of evaluating 'expr' as an Expr. Caller keeps ownership of 'expr'
 // and takes ownership of the result
 Expr *EvaluateExpr(Expr *expr, Oid result_type, int32 typmod);
@@ -768,6 +774,8 @@ List *GetRelChildIndexes(Oid reloid);
 
 Oid GetForeignServerId(Oid reloid);
 
+int16 GetAppendOnlySegmentFilesCount(Relation rel);
+
 void GPDBLockRelationOid(Oid reloid, int lockmode);
 
 char *GetRelFdwName(Oid reloid);
diff --git a/src/include/gpopt/translate/CTranslatorDXLToPlStmt.h b/src/include/gpopt/translate/CTranslatorDXLToPlStmt.h
index 625ed5cd0a3..3cd5fc9d638 100644
--- a/src/include/gpopt/translate/CTranslatorDXLToPlStmt.h
+++ b/src/include/gpopt/translate/CTranslatorDXLToPlStmt.h
@@ -213,6 +213,13 @@ class CTranslatorDXLToPlStmt
 			ctxt_translation_prev_siblings	// translation contexts of previous siblings
 	);
 
+	// translate DXL parallel table scan node into a parallel SeqScan node
+	Plan *TranslateDXLParallelTblScan(
+		const CDXLNode *tbl_scan_dxlnode, CDXLTranslateContext *output_context,
+		CDXLTranslationContextArray *
+			ctxt_translation_prev_siblings	// translation contexts of previous siblings
+	);
+
 	// translate DXL index scan node into a IndexScan node
 	Plan *TranslateDXLIndexScan(
 		const CDXLNode *index_scan_dxlnode,
@@ -657,6 +664,10 @@ class CTranslatorDXLToPlStmt
 
 	// fill the aggno and transno for the aggnode
 	static void TranslateAggFillInfo(CContextDXLToPlStmt *context, Aggref *aggref);
+
+	// extract parallel workers from DXL node tree
+	static ULONG ExtractParallelWorkersFromDXL(const CDXLNode *dxlnode);
+
 };
 }  // namespace gpdxl
 
diff --git a/src/include/gpopt/utils/COptTasks.h b/src/include/gpopt/utils/COptTasks.h
index bed8f36d51a..cc96e63739e 100644
--- a/src/include/gpopt/utils/COptTasks.h
+++ b/src/include/gpopt/utils/COptTasks.h
@@ -90,6 +90,9 @@ struct SOptContext
 	// is serializing a plan to DXL required ?
 	BOOL m_should_serialize_plan_dxl{false};
 
+	// should generate parallel plans ?
+	BOOL m_create_parallel_plan{false};
+
 	// did the optimizer fail unexpectedly?
 	BOOL m_is_unexpected_failure{false};
 
@@ -129,7 +132,8 @@ class COptTasks
 	// create optimizer configuration object
 	static COptimizerConfig *CreateOptimizerConfig(CMemoryPool *mp,
 												   ICostModel *cost_model,
-												   CPlanHint *plan_hints);
+												   CPlanHint *plan_hints,
+												   BOOL enable_parallel_plans = false);
 
 	// optimize a query to a physical DXL
 	static void *OptimizeTask(void *ptr);
diff --git a/src/include/nodes/pathnodes.h b/src/include/nodes/pathnodes.h
index 41220887050..05cac0c9043 100644
--- a/src/include/nodes/pathnodes.h
+++ b/src/include/nodes/pathnodes.h
@@ -505,6 +505,8 @@ struct PlannerInfo
 	int			numPureOrderedAggs; /* CDB: number that use ORDER BY/WITHIN GROUP, not counting DISTINCT */
 	bool		hasNonCombine;	/* CDB: any agg func w/o a combine func? */
 	bool		is_from_orca; /* true if this PlannerInfo was created from Orca*/
+
+	Query	   *aqumv_raw_parse;	/* Raw parse tree for AQUMV join exact-match */
 };
 
 /*
diff --git a/src/include/optimizer/aqumv.h b/src/include/optimizer/aqumv.h
index 6e51d4dbc92..2bb4122cf11 100644
--- a/src/include/optimizer/aqumv.h
+++ b/src/include/optimizer/aqumv.h
@@ -44,5 +44,6 @@ typedef struct AqumvContextData {
 typedef AqumvContextData *AqumvContext;
 
 extern RelOptInfo* answer_query_using_materialized_views(PlannerInfo *root, AqumvContextData *aqumv_context);
+extern RelOptInfo* answer_query_using_materialized_views_for_join(PlannerInfo *root, AqumvContextData *aqumv_context);
 
 #endif   /* AQUMV_H */
diff --git a/src/include/optimizer/orcaopt.h b/src/include/optimizer/orcaopt.h
index 4a045b632c0..6c1f3075bc4 100644
--- a/src/include/optimizer/orcaopt.h
+++ b/src/include/optimizer/orcaopt.h
@@ -33,6 +33,7 @@
 typedef struct OptimizerOptions 
 {
     bool create_vectorization_plan;
+    bool create_parallel_plan;
 } OptimizerOptions;
 
 
diff --git a/src/include/optimizer/planner.h b/src/include/optimizer/planner.h
index 610034b2c62..9715d9fb31a 100644
--- a/src/include/optimizer/planner.h
+++ b/src/include/optimizer/planner.h
@@ -66,4 +66,11 @@ extern bool optimizer_init;
 
 extern void preprocess_qual_conditions(PlannerInfo *root, Node *jtnode);
 
+/* Passthrough data for standard_qp_callback */
+typedef struct
+{
+	List	   *activeWindows;	/* active windows, if any */
+	List	   *groupClause;	/* overrides parse->groupClause */
+} standard_qp_extra;
+
 #endif							/* PLANNER_H */
diff --git a/src/include/optimizer/walkers.h b/src/include/optimizer/walkers.h
index 6d0d38717f5..d29bc5551e8 100644
--- a/src/include/optimizer/walkers.h
+++ b/src/include/optimizer/walkers.h
@@ -43,5 +43,6 @@ extern List *extract_nodes_plan(Plan *pl, int nodeTag, bool descendIntoSubquerie
 extern List *extract_nodes_expression(Node *node, int nodeTag, bool descendIntoSubqueries);
 extern int find_nodes(Node *node, List *nodeTags);
 extern int check_collation(Node *node);
+extern bool has_orderby_ordering_op(Query *query);
 
 #endif /* WALKERS_H_ */
diff --git a/src/include/tcop/tcopprot.h b/src/include/tcop/tcopprot.h
index 33c929e9082..c7c534417a2 100644
--- a/src/include/tcop/tcopprot.h
+++ b/src/include/tcop/tcopprot.h
@@ -47,6 +47,12 @@ typedef enum
 
 extern PGDLLIMPORT int log_statement;
 
+/* Flags for restrict_nonsystem_relation_kind value */
+#define RESTRICT_RELKIND_VIEW			0x01
+#define RESTRICT_RELKIND_FOREIGN_TABLE	0x02
+
+extern PGDLLIMPORT int restrict_nonsystem_relation_kind;
+
 extern List *pg_parse_query(const char *query_string);
 extern List *pg_rewrite_query(Query *query);
 extern List *pg_analyze_and_rewrite(RawStmt *parsetree,
@@ -67,6 +73,9 @@ extern List *pg_plan_queries(List *querytrees, const char *query_string,
 
 extern bool check_max_stack_depth(int *newval, void **extra, GucSource source);
 extern void assign_max_stack_depth(int newval, void *extra);
+extern bool check_restrict_nonsystem_relation_kind(char **newval, void **extra,
+												   GucSource source);
+extern void assign_restrict_nonsystem_relation_kind(const char *newval, void *extra);
 
 extern void die(SIGNAL_ARGS);
 extern void quickdie(SIGNAL_ARGS) pg_attribute_noreturn();
diff --git a/src/include/utils/guc.h b/src/include/utils/guc.h
index aa34138a4b5..652e0b451f3 100644
--- a/src/include/utils/guc.h
+++ b/src/include/utils/guc.h
@@ -295,6 +295,7 @@ extern bool enable_parallel_dedup_semi_join;
 extern bool enable_parallel_dedup_semi_reverse_join;
 extern bool	parallel_query_use_streaming_hashagg;
 extern bool gp_use_streaming_hashagg;
+extern bool optimizer_use_streaming_hashagg;
 extern int  gp_appendonly_insert_files;
 extern int  gp_appendonly_insert_files_tuples_range;
 extern int  gp_random_insert_segments;
diff --git a/src/include/utils/unsync_guc_name.h b/src/include/utils/unsync_guc_name.h
index cba11770a81..85ecb3548e6 100644
--- a/src/include/utils/unsync_guc_name.h
+++ b/src/include/utils/unsync_guc_name.h
@@ -501,6 +501,7 @@
 		"optimizer_skew_factor",
 		"optimizer_use_external_constant_expression_evaluation_for_ints",
 		"optimizer_use_gpdb_allocators",
+		"optimizer_use_streaming_hashagg",
 		"optimizer_xform_bind_threshold",
 		"parallel_leader_participation",
 		"parallel_query_use_streaming_hashagg",
@@ -537,6 +538,7 @@
 		"resource_select_only",
 		"restart_after_crash",
 		"restore_command",
+		"restrict_nonsystem_relation_kind",
 		"role",
 		"runaway_detector_activation_percent",
 		"segment_size",
diff --git a/src/include/utils/workfile_mgr.h b/src/include/utils/workfile_mgr.h
index dfbd17bca57..48c83620610 100644
--- a/src/include/utils/workfile_mgr.h
+++ b/src/include/utils/workfile_mgr.h
@@ -74,4 +74,8 @@ extern workfile_set *workfile_mgr_cache_entries_get_copy(int* num_actives);
 extern uint64 WorkfileSegspace_GetSize(void);
 extern bool workfile_is_active(workfile_set *workfile);
 
+extern uint64 WorkfileTotalBytesWritten(void);
+extern uint64 WorkfileTotalFilesCreated(void);
+extern void WorkfileResetBackendStats(void);
+
 #endif /* __WORKFILE_MGR_H__ */
diff --git a/src/interfaces/libpq/fe-connect.c b/src/interfaces/libpq/fe-connect.c
index 46e8540004e..0d4d2fed864 100644
--- a/src/interfaces/libpq/fe-connect.c
+++ b/src/interfaces/libpq/fe-connect.c
@@ -3168,16 +3168,13 @@ PQconnectPoll(PGconn *conn)
 					{
 						/*
 						 * Server failure of some sort, such as failure to
-						 * fork a backend process.  We need to process and
-						 * report the error message, which might be formatted
-						 * according to either protocol 2 or protocol 3.
-						 * Rather than duplicate the code for that, we flip
-						 * into AWAITING_RESPONSE state and let the code there
-						 * deal with it.  Note we have *not* consumed the "E"
-						 * byte here.
+						 * fork a backend process.  Don't bother retrieving
+						 * the error message; we should not trust it as the
+						 * server has not been authenticated yet.
 						 */
-						conn->status = CONNECTION_AWAITING_RESPONSE;
-						goto keep_going;
+						appendPQExpBuffer(&conn->errorMessage,
+										  libpq_gettext("server sent an error response during SSL exchange\n"));
+						goto error_return;
 					}
 					else
 					{
diff --git a/src/interfaces/libpq/fe-secure-openssl.c b/src/interfaces/libpq/fe-secure-openssl.c
index d75a823b880..186799acf24 100644
--- a/src/interfaces/libpq/fe-secure-openssl.c
+++ b/src/interfaces/libpq/fe-secure-openssl.c
@@ -802,7 +802,6 @@ initialize_SSL(PGconn *conn)
 	bool		have_homedir;
 	bool		have_cert;
 	bool		have_rootcert;
-	EVP_PKEY   *pkey = NULL;
 
 	/*
 	 * We'll need the home directory if any of the relevant parameters are
@@ -1138,6 +1137,7 @@ initialize_SSL(PGconn *conn)
 			/* Colon, but not in second character, treat as engine:key */
 			char	   *engine_str = strdup(conn->sslkey);
 			char	   *engine_colon;
+			EVP_PKEY   *pkey = NULL;
 
 			if (engine_str == NULL)
 			{
diff --git a/src/test/isolation2/expected/analyze_progress.out b/src/test/isolation2/expected/analyze_progress.out
new file mode 100644
index 00000000000..97c02fbe617
--- /dev/null
+++ b/src/test/isolation2/expected/analyze_progress.out
@@ -0,0 +1,95 @@
+-- Test gp_stat_progress_analyze_summary
+-- setup hash distributed table
+CREATE TABLE t_analyze_part (a INT, b INT) DISTRIBUTED BY (a);
+CREATE
+INSERT INTO t_analyze_part SELECT i, i FROM generate_series(1, 100000) i;
+INSERT 100000
+
+-- Suspend analyze after scanning 20 blocks on each segment
+SELECT gp_inject_fault('analyze_block', 'suspend', '', '', '', 20, 20, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_inject_fault 
+-----------------
+ Success:        
+ Success:        
+ Success:        
+(3 rows)
+
+-- session 1: analyze the table
+1&: ANALYZE t_analyze_part;  <waiting ...>
+SELECT gp_wait_until_triggered_fault('analyze_block', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_wait_until_triggered_fault 
+-------------------------------
+ Success:                      
+ Success:                      
+ Success:                      
+(3 rows)
+
+-- session 2: query pg_stat_progress_analyze while the analyze is running, the view should indicate 60 blocks have been scanned as aggregated progress of 3 segments
+2: SELECT pid IS NOT NULL as has_pid, datname, relid::regclass, phase, sample_blks_total, sample_blks_scanned FROM gp_stat_progress_analyze_summary;
+ has_pid | datname        | relid          | phase                 | sample_blks_total | sample_blks_scanned 
+---------+----------------+----------------+-----------------------+-------------------+---------------------
+ t       | isolation2test | t_analyze_part | acquiring sample rows | 111               | 60                  
+(1 row)
+
+-- Reset fault injector
+SELECT gp_inject_fault('analyze_block', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_inject_fault 
+-----------------
+ Success:        
+ Success:        
+ Success:        
+(3 rows)
+1<:  <... completed>
+ANALYZE
+
+-- teardown
+DROP TABLE t_analyze_part;
+DROP
+
+-- setup replicated table
+CREATE TABLE t_analyze_repl (a INT, b INT) DISTRIBUTED REPLICATED;
+CREATE
+INSERT INTO t_analyze_repl SELECT i, i FROM generate_series(1, 100000) i;
+INSERT 100000
+
+-- Suspend analyze after scanning 20 blocks on each segment
+SELECT gp_inject_fault('analyze_block', 'suspend', '', '', '', 20, 20, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_inject_fault 
+-----------------
+ Success:        
+ Success:        
+ Success:        
+(3 rows)
+
+-- session 1: analyze the table
+1&: ANALYZE t_analyze_repl;  <waiting ...>
+SELECT gp_wait_until_triggered_fault('analyze_block', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_wait_until_triggered_fault 
+-------------------------------
+ Success:                      
+ Success:                      
+ Success:                      
+(3 rows)
+
+-- session 2: query pg_stat_progress_analyze while the analyze is running, the view should indicate 20 blocks have been scanned as average progress of 3 segments
+2: SELECT pid IS NOT NULL as has_pid, datname, relid::regclass, phase, sample_blks_total, sample_blks_scanned FROM gp_stat_progress_analyze_summary;
+ has_pid | datname        | relid          | phase                 | sample_blks_total | sample_blks_scanned 
+---------+----------------+----------------+-----------------------+-------------------+---------------------
+ t       | isolation2test | t_analyze_repl | acquiring sample rows | 111               | 20                  
+(1 row)
+
+-- Reset fault injector
+SELECT gp_inject_fault('analyze_block', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+ gp_inject_fault 
+-----------------
+ Success:        
+ Success:        
+ Success:        
+(3 rows)
+1<:  <... completed>
+ANALYZE
+
+-- teardown
+DROP TABLE t_analyze_repl;
+DROP
+
diff --git a/src/test/isolation2/expected/ao_index_build_progress.out b/src/test/isolation2/expected/ao_index_build_progress.out
index 1048076ce9f..2cc97d09031 100644
--- a/src/test/isolation2/expected/ao_index_build_progress.out
+++ b/src/test/isolation2/expected/ao_index_build_progress.out
@@ -8,36 +8,52 @@ CREATE
 -- Insert all tuples to seg1.
 INSERT INTO ao_index_build_progress SELECT 0, i FROM generate_series(1, 100000) i;
 INSERT 100000
+INSERT INTO ao_index_build_progress SELECT 2, i FROM generate_series(1, 100000) i;
+INSERT 100000
+INSERT INTO ao_index_build_progress SELECT 5, i FROM generate_series(1, 100000) i;
+INSERT 100000
 
 -- Suspend execution when some blocks have been read.
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 10, 10, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 10, 10, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1&: CREATE INDEX ON ao_index_build_progress(i);  <waiting ...>
 
 -- Wait until some AO varblocks have been read.
-SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 10, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 10, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
-(1 row)
+ Success:                      
+ Success:                      
+(3 rows)
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the relation's on-disk size.
-1U: SELECT command, phase, (pg_relation_size('ao_index_build_progress') + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS blocks_total_actual, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM pg_stat_progress_create_index WHERE relid = 'ao_index_build_progress'::regclass;
+SELECT command, phase, (pg_relation_size('ao_index_build_progress') + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS blocks_total_actual, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM gp_stat_progress_create_index WHERE gp_segment_id = 1 AND relid = 'ao_index_build_progress'::regclass;
  command      | phase                          | blocks_total_actual | blocks_total_reported | blocks_done_reported 
 --------------+--------------------------------+---------------------+-----------------------+----------------------
  CREATE INDEX | building index: scanning table | 10                  | 10                    | 2                    
 (1 row)
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'ao_index_build_progress'::regclass;
+ command      | phase                          | blocks_total | blocks_done 
+--------------+--------------------------------+--------------+-------------
+ CREATE INDEX | building index: scanning table | 30           | 6           
+(1 row)
 
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1<:  <... completed>
 CREATE
@@ -49,38 +65,54 @@ CREATE
 -- Insert all tuples to seg1.
 INSERT INTO aoco_index_build_progress SELECT 0, i FROM generate_series(1, 100000) i;
 INSERT 100000
+INSERT INTO aoco_index_build_progress SELECT 2, i FROM generate_series(1, 100000) i;
+INSERT 100000
+INSERT INTO aoco_index_build_progress SELECT 5, i FROM generate_series(1, 100000) i;
+INSERT 100000
 
 -- Suspend execution when some blocks have been read.
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1&: CREATE INDEX ON aoco_index_build_progress(i);  <waiting ...>
 
 -- Wait until some AOCO varblocks have been read.
-SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
-(1 row)
+ Success:                      
+ Success:                      
+(3 rows)
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the relation's on-disk size.
 -- Note: all blocks for the relation have to be scanned as we are building an
 -- index for the first time and a block directory has to be created.
-1U: SELECT command, phase, (pg_relation_size('aoco_index_build_progress') + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS blocks_total_actual, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM pg_stat_progress_create_index WHERE relid = 'aoco_index_build_progress'::regclass;
+SELECT command, phase, (pg_relation_size('aoco_index_build_progress') + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS blocks_total_actual, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM gp_stat_progress_create_index WHERE gp_segment_id = 1 AND relid = 'aoco_index_build_progress'::regclass;
  command      | phase                          | blocks_total_actual | blocks_total_reported | blocks_done_reported 
 --------------+--------------------------------+---------------------+-----------------------+----------------------
  CREATE INDEX | building index: scanning table | 20                  | 20                    | 4                    
 (1 row)
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'aoco_index_build_progress'::regclass;
+ command      | phase                          | blocks_total | blocks_done 
+--------------+--------------------------------+--------------+-------------
+ CREATE INDEX | building index: scanning table | 60           | 12          
+(1 row)
 
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1<:  <... completed>
 CREATE
@@ -88,36 +120,48 @@ CREATE
 -- Repeat the test for another index build
 
 -- Suspend execution when some blocks have been read.
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1&: CREATE INDEX ON aoco_index_build_progress(j);  <waiting ...>
 
 -- Wait until some AOCO varblocks have been read.
-SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
-(1 row)
+ Success:                      
+ Success:                      
+(3 rows)
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the size of col j's segfile.
 -- Note: since we already had a block directory prior to the index build on
--- column 'j', only column 'j' will be scanned. CBDB_CHERRY_PICK_MERGE_FIXME: fix when ao blkdir will be supported
-1U: SELECT command, phase, ((pg_stat_file(pg_relation_filepath('aoco_index_build_progress') || '.' || 129)).size + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS col_j_blocks, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM pg_stat_progress_create_index WHERE relid = 'aoco_index_build_progress'::regclass;
+-- column 'j', only column 'j' will be scanned.
+1U: SELECT command, phase, ((pg_stat_file(pg_relation_filepath('aoco_index_build_progress') || '.' || 129)).size + (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS col_j_blocks, blocks_total AS blocks_total_reported, blocks_done AS blocks_done_reported FROM gp_stat_progress_create_index WHERE gp_segment_id = 1 AND relid = 'aoco_index_build_progress'::regclass;
  command      | phase                          | col_j_blocks | blocks_total_reported | blocks_done_reported 
 --------------+--------------------------------+--------------+-----------------------+----------------------
  CREATE INDEX | building index: scanning table | 8            | 20                    | 4                    
 (1 row)
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'aoco_index_build_progress'::regclass;
+ command      | phase                          | blocks_total | blocks_done 
+--------------+--------------------------------+--------------+-------------
+ CREATE INDEX | building index: scanning table | 24           | 9           
+(1 row)
 
-SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1<:  <... completed>
 CREATE
diff --git a/src/test/isolation2/expected/copy_to_concurrent_reorganize.out b/src/test/isolation2/expected/copy_to_concurrent_reorganize.out
deleted file mode 100644
index 0a7dfd38801..00000000000
--- a/src/test/isolation2/expected/copy_to_concurrent_reorganize.out
+++ /dev/null
@@ -1,918 +0,0 @@
--- Test: COPY TO concurrent with ALTER TABLE SET WITH (reorganize=true)
--- Issue: https://github.com/apache/cloudberry/issues/1545
---
--- Tests 2.1: Core fix (relation-based COPY TO)
--- Tests 2.2-2.5: Extended fixes for query-based, partitioned, RLS, and CTAS paths
-
--- ============================================================
--- Test 2.1: relation-based COPY TO + concurrent reorganize
--- Reproduces issue #1545: COPY TO should return correct row count
--- after waiting for reorganize to release AccessExclusiveLock.
--- ============================================================
-
-CREATE TABLE copy_reorg_test (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_reorg_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_test;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_reorg_test SET WITH (reorganize=true);
-ALTER
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
--- At this point PortalRunUtility has already acquired a snapshot (before reorganize commits),
--- then DoCopy tries to acquire the lock and blocks.
-2&: COPY copy_reorg_test TO '/tmp/copy_reorg_test.csv';  <waiting ...>
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_reorg_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-COMMIT
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_reorg_verify FROM '/tmp/copy_reorg_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_reorg_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_reorg_verify;
-DROP
-DROP TABLE copy_reorg_test;
-DROP
-
--- ============================================================
--- Test 2.2: query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after pg_analyze_and_rewrite()
--- acquires all relation locks via AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_test (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_query_reorg_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_query_reorg_test;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: reorganize holds AccessExclusiveLock
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_query_reorg_test SET WITH (reorganize=true);
-ALTER
-
--- Session 2: query-based COPY TO blocks (lock acquired in pg_analyze_and_rewrite -> AcquireRewriteLocks)
-2&: COPY (SELECT * FROM copy_query_reorg_test) TO '/tmp/copy_query_reorg_test.csv';  <waiting ...>
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY (SELECT%copy_query_reorg_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit
-1: COMMIT;
-COMMIT
-
--- Session 2: Complete
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_query_reorg_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_query_reorg_verify FROM '/tmp/copy_query_reorg_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_query_reorg_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_query_reorg_verify;
-DROP
-DROP TABLE copy_query_reorg_test;
-DROP
-
--- ============================================================
--- Test 2.3: partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to eagerly lock all child
--- partitions before refreshing the snapshot, ensuring the snapshot sees all
--- child reorganize commits before the query is built.
--- ============================================================
-
-CREATE TABLE copy_part_parent (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE
-CREATE TABLE copy_part_child1 PARTITION OF copy_part_parent FOR VALUES FROM (1) TO (501);
-CREATE
-CREATE TABLE copy_part_child2 PARTITION OF copy_part_parent FOR VALUES FROM (501) TO (1001);
-CREATE
-INSERT INTO copy_part_parent SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_part_parent;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: reorganize the child partition
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_part_child1 SET WITH (reorganize=true);
-ALTER
-
--- Session 2: COPY parent TO (internally converted to query-based, child lock acquired in analyze phase)
-2&: COPY copy_part_parent TO '/tmp/copy_part_parent.csv';  <waiting ...>
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_part_parent%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit
-1: COMMIT;
-COMMIT
-
--- Session 2: Complete
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_part_verify (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_part_verify FROM '/tmp/copy_part_parent.csv';
-COPY 1000
-SELECT count(*) FROM copy_part_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_part_verify;
-DROP
-DROP TABLE copy_part_parent;
-DROP
-
--- ============================================================
--- Test 2.4: RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.2 — BeginCopy() refreshes snapshot after AcquireRewriteLocks()
--- which also acquires the lock on the RLS policy's lookup table.
--- ============================================================
-
-CREATE TABLE copy_rls_lookup (cat INT) DISTRIBUTED BY (cat);
-CREATE
-INSERT INTO copy_rls_lookup SELECT i FROM generate_series(1, 2) i;
-INSERT 2
-
-CREATE TABLE copy_rls_main (a INT, category INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_rls_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-INSERT 1000
-
-ALTER TABLE copy_rls_main ENABLE ROW LEVEL SECURITY;
-ALTER
-CREATE POLICY p_rls ON copy_rls_main USING (category IN (SELECT cat FROM copy_rls_lookup));
-CREATE
-
--- Create non-superuser to trigger RLS (needs pg_write_server_files to COPY TO file)
-CREATE ROLE copy_rls_testuser;
-CREATE
-GRANT pg_write_server_files TO copy_rls_testuser;
-GRANT
-GRANT ALL ON copy_rls_main TO copy_rls_testuser;
-GRANT
-GRANT ALL ON copy_rls_lookup TO copy_rls_testuser;
-GRANT
-
-SELECT count(*) FROM copy_rls_main;
- count 
--------
- 1000  
-(1 row)
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_testuser; COPY copy_rls_main TO '/tmp/copy_rls_main.csv';
-SET 400
-
--- Session 1: reorganize the lookup table
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_rls_lookup SET WITH (reorganize=true);
-ALTER
-
--- Session 2: COPY TO as non-superuser (RLS active, internally converted to query-based)
-2&: SET ROLE copy_rls_testuser; COPY copy_rls_main TO '/tmp/copy_rls_main.csv';  <waiting ...>
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE '%COPY copy_rls_main%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit
-1: COMMIT;
-COMMIT
-
--- Session 2: Complete
-2<:  <... completed>
-SET 400
-
--- Reset session 2's role to avoid leaking to subsequent tests
-2: RESET ROLE;
-RESET
-
--- Verify: should match baseline count (400 rows filtered by RLS)
-RESET ROLE;
-RESET
-CREATE TABLE copy_rls_verify (a INT, category INT) DISTRIBUTED BY (a);
-CREATE
-COPY copy_rls_verify FROM '/tmp/copy_rls_main.csv';
-COPY 400
-SELECT count(*) FROM copy_rls_verify;
- count 
--------
- 400   
-(1 row)
-
--- Cleanup
-DROP TABLE copy_rls_verify;
-DROP
-DROP POLICY p_rls ON copy_rls_main;
-DROP
-DROP TABLE copy_rls_main;
-DROP
-DROP TABLE copy_rls_lookup;
-DROP
-DROP ROLE copy_rls_testuser;
-DROP
-
--- ============================================================
--- Test 2.5: CTAS + concurrent reorganize
--- Fixed as a side effect: CTAS goes through pg_analyze_and_rewrite() +
--- AcquireRewriteLocks(), so the snapshot refresh in BeginCopy() also fixes it.
--- ============================================================
-
-CREATE TABLE ctas_reorg_src (a INT, b INT) DISTRIBUTED BY (a);
-CREATE
-INSERT INTO ctas_reorg_src SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM ctas_reorg_src;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: reorganize
-1: BEGIN;
-BEGIN
-1: ALTER TABLE ctas_reorg_src SET WITH (reorganize=true);
-ALTER
-
--- Session 2: CTAS should block (lock acquired in executor or analyze phase)
-2&: CREATE TABLE ctas_reorg_dst AS SELECT * FROM ctas_reorg_src DISTRIBUTED BY (a);  <waiting ...>
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'CREATE TABLE ctas_reorg_dst%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit
-1: COMMIT;
-COMMIT
-
--- Session 2: Complete
-2<:  <... completed>
-CREATE 1000
-
--- Verify row count after CTAS completes
-SELECT count(*) FROM ctas_reorg_dst;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE ctas_reorg_dst;
-DROP
-DROP TABLE ctas_reorg_src;
-DROP
-
--- NOTE: Test 2.6 (change distribution key + query-based COPY TO) removed because
--- ALTER TABLE SET DISTRIBUTED BY + concurrent query-based COPY TO causes a server
--- crash (pre-existing Cloudberry bug, not related to this fix).
-
--- ============================================================
--- Test 2.1a: AO row table — relation-based COPY TO + concurrent reorganize
--- Same as 2.1 but using append-optimized row-oriented table.
--- ============================================================
-
-CREATE TABLE copy_reorg_ao_row_test (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_reorg_ao_row_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_ao_row_test;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_reorg_ao_row_test SET WITH (reorganize=true);
-ALTER
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_ao_row_test TO '/tmp/copy_reorg_ao_row_test.csv';  <waiting ...>
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_reorg_ao_row_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-COMMIT
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-COPY copy_reorg_ao_row_verify FROM '/tmp/copy_reorg_ao_row_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_reorg_ao_row_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_reorg_ao_row_verify;
-DROP
-DROP TABLE copy_reorg_ao_row_test;
-DROP
-
--- ============================================================
--- Test 2.1b: AO column table — relation-based COPY TO + concurrent reorganize
--- Same as 2.1 but using append-optimized column-oriented table.
--- ============================================================
-
-CREATE TABLE copy_reorg_ao_col_test (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_reorg_ao_col_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_ao_col_test;
- count 
--------
- 1000  
-(1 row)
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_reorg_ao_col_test SET WITH (reorganize=true);
-ALTER
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_ao_col_test TO '/tmp/copy_reorg_ao_col_test.csv';  <waiting ...>
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_reorg_ao_col_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-COMMIT
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:  <... completed>
-COPY 1000
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-COPY copy_reorg_ao_col_verify FROM '/tmp/copy_reorg_ao_col_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_reorg_ao_col_verify;
- count 
--------
- 1000  
-(1 row)
-
--- Cleanup
-DROP TABLE copy_reorg_ao_col_verify;
-DROP
-DROP TABLE copy_reorg_ao_col_test;
-DROP
-
--- ============================================================
--- Test 2.2a: AO row — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_ao_row_test (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_query_reorg_ao_row_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_query_reorg_ao_row_test;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_query_reorg_ao_row_test SET WITH (reorganize=true);
-ALTER
-
-2&: COPY (SELECT * FROM copy_query_reorg_ao_row_test) TO '/tmp/copy_query_reorg_ao_row_test.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY (SELECT%copy_query_reorg_ao_row_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_query_reorg_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-COPY copy_query_reorg_ao_row_verify FROM '/tmp/copy_query_reorg_ao_row_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_query_reorg_ao_row_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_query_reorg_ao_row_verify;
-DROP
-DROP TABLE copy_query_reorg_ao_row_test;
-DROP
-
--- ============================================================
--- Test 2.2b: AO column — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_ao_col_test (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_query_reorg_ao_col_test SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_query_reorg_ao_col_test;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_query_reorg_ao_col_test SET WITH (reorganize=true);
-ALTER
-
-2&: COPY (SELECT * FROM copy_query_reorg_ao_col_test) TO '/tmp/copy_query_reorg_ao_col_test.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY (SELECT%copy_query_reorg_ao_col_test%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_query_reorg_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-COPY copy_query_reorg_ao_col_verify FROM '/tmp/copy_query_reorg_ao_col_test.csv';
-COPY 1000
-SELECT count(*) FROM copy_query_reorg_ao_col_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_query_reorg_ao_col_verify;
-DROP
-DROP TABLE copy_query_reorg_ao_col_test;
-DROP
-
--- ============================================================
--- Test 2.3a: AO row — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_ao_row (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE
-CREATE TABLE copy_part_child1_ao_row PARTITION OF copy_part_parent_ao_row FOR VALUES FROM (1) TO (501) USING ao_row;
-CREATE
-CREATE TABLE copy_part_child2_ao_row PARTITION OF copy_part_parent_ao_row FOR VALUES FROM (501) TO (1001) USING ao_row;
-CREATE
-INSERT INTO copy_part_parent_ao_row SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_part_parent_ao_row;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_part_child1_ao_row SET WITH (reorganize=true);
-ALTER
-
-2&: COPY copy_part_parent_ao_row TO '/tmp/copy_part_parent_ao_row.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_part_parent_ao_row%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_part_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-COPY copy_part_ao_row_verify FROM '/tmp/copy_part_parent_ao_row.csv';
-COPY 1000
-SELECT count(*) FROM copy_part_ao_row_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_part_ao_row_verify;
-DROP
-DROP TABLE copy_part_parent_ao_row;
-DROP
-
--- ============================================================
--- Test 2.3b: AO column — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_ao_col (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE
-CREATE TABLE copy_part_child1_ao_col PARTITION OF copy_part_parent_ao_col FOR VALUES FROM (1) TO (501) USING ao_column;
-CREATE
-CREATE TABLE copy_part_child2_ao_col PARTITION OF copy_part_parent_ao_col FOR VALUES FROM (501) TO (1001) USING ao_column;
-CREATE
-INSERT INTO copy_part_parent_ao_col SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM copy_part_parent_ao_col;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_part_child1_ao_col SET WITH (reorganize=true);
-ALTER
-
-2&: COPY copy_part_parent_ao_col TO '/tmp/copy_part_parent_ao_col.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'COPY copy_part_parent_ao_col%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-COPY 1000
-
-CREATE TABLE copy_part_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-COPY copy_part_ao_col_verify FROM '/tmp/copy_part_parent_ao_col.csv';
-COPY 1000
-SELECT count(*) FROM copy_part_ao_col_verify;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE copy_part_ao_col_verify;
-DROP
-DROP TABLE copy_part_parent_ao_col;
-DROP
-
--- ============================================================
--- Test 2.4a: AO row — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.4 — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_ao_row_lookup (cat INT) USING ao_row DISTRIBUTED BY (cat);
-CREATE
-INSERT INTO copy_rls_ao_row_lookup SELECT i FROM generate_series(1, 2) i;
-INSERT 2
-
-CREATE TABLE copy_rls_ao_row_main (a INT, category INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_rls_ao_row_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-INSERT 1000
-
-ALTER TABLE copy_rls_ao_row_main ENABLE ROW LEVEL SECURITY;
-ALTER
-CREATE POLICY p_rls_ao_row ON copy_rls_ao_row_main USING (category IN (SELECT cat FROM copy_rls_ao_row_lookup));
-CREATE
-
-CREATE ROLE copy_rls_ao_row_testuser;
-CREATE
-GRANT pg_write_server_files TO copy_rls_ao_row_testuser;
-GRANT
-GRANT ALL ON copy_rls_ao_row_main TO copy_rls_ao_row_testuser;
-GRANT
-GRANT ALL ON copy_rls_ao_row_lookup TO copy_rls_ao_row_testuser;
-GRANT
-
-SELECT count(*) FROM copy_rls_ao_row_main;
- count 
--------
- 1000  
-(1 row)
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_ao_row_testuser; COPY copy_rls_ao_row_main TO '/tmp/copy_rls_ao_row_main.csv';
-SET 400
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_rls_ao_row_lookup SET WITH (reorganize=true);
-ALTER
-
-2&: SET ROLE copy_rls_ao_row_testuser; COPY copy_rls_ao_row_main TO '/tmp/copy_rls_ao_row_main.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE '%COPY copy_rls_ao_row_main%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-SET 400
-
-2: RESET ROLE;
-RESET
-
-RESET ROLE;
-RESET
-CREATE TABLE copy_rls_ao_row_verify (a INT, category INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-COPY copy_rls_ao_row_verify FROM '/tmp/copy_rls_ao_row_main.csv';
-COPY 400
-SELECT count(*) FROM copy_rls_ao_row_verify;
- count 
--------
- 400   
-(1 row)
-
-DROP TABLE copy_rls_ao_row_verify;
-DROP
-DROP POLICY p_rls_ao_row ON copy_rls_ao_row_main;
-DROP
-DROP TABLE copy_rls_ao_row_main;
-DROP
-DROP TABLE copy_rls_ao_row_lookup;
-DROP
-DROP ROLE copy_rls_ao_row_testuser;
-DROP
-
--- ============================================================
--- Test 2.4b: AO column — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.4 — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_ao_col_lookup (cat INT) USING ao_column DISTRIBUTED BY (cat);
-CREATE
-INSERT INTO copy_rls_ao_col_lookup SELECT i FROM generate_series(1, 2) i;
-INSERT 2
-
-CREATE TABLE copy_rls_ao_col_main (a INT, category INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-INSERT INTO copy_rls_ao_col_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-INSERT 1000
-
-ALTER TABLE copy_rls_ao_col_main ENABLE ROW LEVEL SECURITY;
-ALTER
-CREATE POLICY p_rls_ao_col ON copy_rls_ao_col_main USING (category IN (SELECT cat FROM copy_rls_ao_col_lookup));
-CREATE
-
-CREATE ROLE copy_rls_ao_col_testuser;
-CREATE
-GRANT pg_write_server_files TO copy_rls_ao_col_testuser;
-GRANT
-GRANT ALL ON copy_rls_ao_col_main TO copy_rls_ao_col_testuser;
-GRANT
-GRANT ALL ON copy_rls_ao_col_lookup TO copy_rls_ao_col_testuser;
-GRANT
-
-SELECT count(*) FROM copy_rls_ao_col_main;
- count 
--------
- 1000  
-(1 row)
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_ao_col_testuser; COPY copy_rls_ao_col_main TO '/tmp/copy_rls_ao_col_main.csv';
-SET 400
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE copy_rls_ao_col_lookup SET WITH (reorganize=true);
-ALTER
-
-2&: SET ROLE copy_rls_ao_col_testuser; COPY copy_rls_ao_col_main TO '/tmp/copy_rls_ao_col_main.csv';  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE '%COPY copy_rls_ao_col_main%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-SET 400
-
-2: RESET ROLE;
-RESET
-
-RESET ROLE;
-RESET
-CREATE TABLE copy_rls_ao_col_verify (a INT, category INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-COPY copy_rls_ao_col_verify FROM '/tmp/copy_rls_ao_col_main.csv';
-COPY 400
-SELECT count(*) FROM copy_rls_ao_col_verify;
- count 
--------
- 400   
-(1 row)
-
-DROP TABLE copy_rls_ao_col_verify;
-DROP
-DROP POLICY p_rls_ao_col ON copy_rls_ao_col_main;
-DROP
-DROP TABLE copy_rls_ao_col_main;
-DROP
-DROP TABLE copy_rls_ao_col_lookup;
-DROP
-DROP ROLE copy_rls_ao_col_testuser;
-DROP
-
--- ============================================================
--- Test 2.5a: AO row — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_ao_row_src (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-CREATE
-INSERT INTO ctas_reorg_ao_row_src SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM ctas_reorg_ao_row_src;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE ctas_reorg_ao_row_src SET WITH (reorganize=true);
-ALTER
-
-2&: CREATE TABLE ctas_reorg_ao_row_dst AS SELECT * FROM ctas_reorg_ao_row_src DISTRIBUTED BY (a);  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'CREATE TABLE ctas_reorg_ao_row_dst%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-CREATE 1000
-
-SELECT count(*) FROM ctas_reorg_ao_row_dst;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE ctas_reorg_ao_row_dst;
-DROP
-DROP TABLE ctas_reorg_ao_row_src;
-DROP
-
--- ============================================================
--- Test 2.5b: AO column — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_ao_col_src (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-CREATE
-INSERT INTO ctas_reorg_ao_col_src SELECT i, i FROM generate_series(1, 1000) i;
-INSERT 1000
-
-SELECT count(*) FROM ctas_reorg_ao_col_src;
- count 
--------
- 1000  
-(1 row)
-
-1: BEGIN;
-BEGIN
-1: ALTER TABLE ctas_reorg_ao_col_src SET WITH (reorganize=true);
-ALTER
-
-2&: CREATE TABLE ctas_reorg_ao_col_dst AS SELECT * FROM ctas_reorg_ao_col_src DISTRIBUTED BY (a);  <waiting ...>
-
-1: SELECT count(*) > 0 FROM pg_stat_activity WHERE query LIKE 'CREATE TABLE ctas_reorg_ao_col_dst%' AND wait_event_type = 'Lock';
- ?column? 
-----------
- t        
-(1 row)
-
-1: COMMIT;
-COMMIT
-2<:  <... completed>
-CREATE 1000
-
-SELECT count(*) FROM ctas_reorg_ao_col_dst;
- count 
--------
- 1000  
-(1 row)
-
-DROP TABLE ctas_reorg_ao_col_dst;
-DROP
-DROP TABLE ctas_reorg_ao_col_src;
-DROP
-
--- NOTE: Tests 2.6a/2.6b (AO variants of change distribution key + query-based COPY TO)
--- removed for the same reason as test 2.6 (server crash, pre-existing bug).
diff --git a/src/test/isolation2/expected/resgroup/resgroup_bypass.out b/src/test/isolation2/expected/resgroup/resgroup_bypass.out
index 5cff41d745f..878c759c306 100644
--- a/src/test/isolation2/expected/resgroup/resgroup_bypass.out
+++ b/src/test/isolation2/expected/resgroup/resgroup_bypass.out
@@ -276,6 +276,24 @@ SELECT gp_inject_fault('func_init_plan_end', 'reset', 1);
 1q: ... <quitting>
 2q: ... <quitting>
 
+-- verify the increment of num_executed in gp_toolkit.gp_resgroup_status
+1: SET ROLE role_bypass;
+SET
+1: SELECT num_executed INTO temporary temp_num1 FROM gp_toolkit.gp_resgroup_status WHERE groupname='rg_bypass';
+SELECT 1
+1: SELECT num_executed INTO temporary temp_num2 FROM gp_toolkit.gp_resgroup_status WHERE groupname='rg_bypass';
+SELECT 1
+1: SELECT temp_num2.num_executed - temp_num1.num_executed AS delta FROM temp_num1, temp_num2;
+ delta 
+-------
+ 1     
+(1 row)
+1: DROP TABLE temp_num1;
+DROP
+1: DROP TABLE temp_num2;
+DROP
+1q: ... <quitting>
+
 -- cleanup
 -- start_ignore
 DROP TABLE t_bypass;
diff --git a/src/test/isolation2/expected/vacuum_progress_row.out b/src/test/isolation2/expected/vacuum_progress_row.out
index 0f1b3e65ef5..619b3e41b80 100644
--- a/src/test/isolation2/expected/vacuum_progress_row.out
+++ b/src/test/isolation2/expected/vacuum_progress_row.out
@@ -16,22 +16,21 @@ CREATE
 CREATE INDEX on vacuum_progress_ao_row(j);
 CREATE
 
--- Insert all tuples to seg1 from two current sessions so that data are stored
--- in two segment files.
+-- Insert from two current sessions so that data are stored in two segment files.
 1: BEGIN;
 BEGIN
 2: BEGIN;
 BEGIN
-1: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
+1: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
 INSERT 100000
-2: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
+2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
 INSERT 100000
 -- Commit so that the logical EOF of segno 2 is non-zero.
 2: COMMIT;
 COMMIT
 2: BEGIN;
 BEGIN
-2: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
+2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
 INSERT 100000
 -- Abort so that segno 2 has dead tuples after its logical EOF
 2: ABORT;
@@ -53,6 +52,11 @@ SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_
 (1 row)
 SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
  n_live_tup | n_dead_tup | last_vacuum | vacuum_count 
+------------+------------+-------------+--------------
+ 33327      | 66654      |             | 0            
+(1 row)
+SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM gp_stat_all_tables_summary WHERE relname = 'vacuum_progress_ao_row';
+ n_live_tup | n_dead_tup | last_vacuum | vacuum_count 
 ------------+------------+-------------+--------------
  100000     | 200000     |             | 0            
 (1 row)
@@ -60,11 +64,13 @@ SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM pg_stat_all_tables
 -- Perform VACUUM and observe the progress
 
 -- Suspend execution at pre-cleanup phase after truncating both segfiles to their logical EOF.
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', '', '', '', 2, 2, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', '', '', '', 2, 2, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 
 1: set Debug_appendonly_print_compaction to on;
 SET
@@ -75,85 +81,120 @@ SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 2
  Success:                      
 (1 row)
 -- We are in pre_cleanup phase and some blocks should've been vacuumed by now
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
  relname                | phase                        | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ------------------------+------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | append-optimized pre-cleanup | 165             | 0                 | 110                | 0                  | 100000          | 0               
+ vacuum_progress_ao_row | append-optimized pre-cleanup | 55              | 0                 | 37                 | 0                  | 33327           | 0               
+(1 row)
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+ relname                | phase                        | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized pre-cleanup | 166             | 0                 | 111                | 0                  | 100000          | 0               
 (1 row)
 
 -- Resume execution and suspend again in the middle of compact phase
-SELECT gp_inject_fault('appendonly_insert', 'suspend', '', '', '', 200, 200, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_insert', 'suspend', '', '', '', 200, 200, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+ Success:        
+ Success:        
+(3 rows)
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 SELECT gp_wait_until_triggered_fault('appendonly_insert', 200, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
 (1 row)
 -- We are in compact phase. num_dead_tuples should increase as we move and count tuples, one by one.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
  relname                | phase                    | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ------------------------+--------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | append-optimized compact | 165             | 0                 | 110                | 0                  | 100000          | 199             
+ vacuum_progress_ao_row | append-optimized compact | 55              | 0                 | 37                 | 0                  | 33327           | 227             
+(1 row)
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+ relname                | phase                    | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+--------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized compact | 166             | 0                 | 111                | 0                  | 100000          | 594             
 (1 row)
 
 -- Resume execution and suspend again after compacting all segfiles
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_compact', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
-SELECT gp_inject_fault('appendonly_insert', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+ Success:        
+ Success:        
+(3 rows)
+SELECT gp_inject_fault('appendonly_insert', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 SELECT gp_wait_until_triggered_fault('vacuum_ao_after_compact', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
 (1 row)
 -- After compacting all segfiles we expect 50000 dead tuples
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
  relname                | phase                    | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ------------------------+--------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | append-optimized compact | 165             | 55                | 110                | 0                  | 100000          | 50000           
+ vacuum_progress_ao_row | append-optimized compact | 55              | 19                | 37                 | 0                  | 33327           | 16622           
+(1 row)
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+ relname                | phase                    | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+--------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized compact | 166             | 57                | 111                | 0                  | 100000          | 50000           
 (1 row)
 
 -- Resume execution and entering post_cleaup phase, suspend at the end of it.
-SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+ Success:        
+ Success:        
+(3 rows)
+SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 SELECT gp_wait_until_triggered_fault('vacuum_ao_post_cleanup_end', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
 (1 row)
 -- We should have skipped recycling the awaiting drop segment because the segment was still visible to the SELECT gp_wait_until_triggered_fault query.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
  relname                | phase                         | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ------------------------+-------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | append-optimized post-cleanup | 165             | 55                | 110                | 0                  | 100000          | 50000           
+ vacuum_progress_ao_row | append-optimized post-cleanup | 55              | 19                | 37                 | 0                  | 33327           | 16622           
 (1 row)
-SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+ relname                | phase                         | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+-------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized post-cleanup | 166             | 57                | 111                | 0                  | 100000          | 50000           
+(1 row)
+
+SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
+ Success:        
+ Success:        
+(3 rows)
 1<:  <... completed>
 VACUUM
 
@@ -166,63 +207,68 @@ VACUUM
 SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_progress_ao_row';
  relpages | reltuples | relallvisible 
 ----------+-----------+---------------
- 83       | 50000     | 0             
+ 84       | 50000     | 0             
 (1 row)
 SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
  n_live_tup | n_dead_tup | has_last_vacuum | vacuum_count 
 ------------+------------+-----------------+--------------
- 50000      | 0          | t               | 1            
+ 16705      | 0          | t               | 1            
 (1 row)
 
 -- Perform VACUUM again to recycle the remaining awaiting drop segment marked by the previous run.
-SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
 (1 row)
-1&: VACUUM vacuum_progress_ao_row;  <waiting ...>
--- Resume execution and entering pre_cleanup phase, suspend at vacuuming indexes.
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', dbid) FROM gp_segment_configuration WHERE content > 0 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
-SELECT gp_wait_until_triggered_fault('vacuum_ao_after_index_delete', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+ Success:        
+(2 rows)
+1&: VACUUM vacuum_progress_ao_row;  <waiting ...>
+-- Resume execution and entering pre_cleanup phase, suspend at vacuuming indexes for segment 0.
+SELECT gp_wait_until_triggered_fault('vacuum_ao_after_index_delete', 1, dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
  gp_wait_until_triggered_fault 
 -------------------------------
  Success:                      
 (1 row)
--- We are in vacuuming indexes phase (part of ao pre_cleanup phase), index_vacuum_count should increase to 1.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+-- Resume execution and moving on to truncate segments that were marked as AWAITING_DROP for segment 1 and 2, there should be only 1.
+SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 1, dbid) FROM gp_segment_configuration WHERE content > 0 AND role = 'p';
+ gp_wait_until_triggered_fault 
+-------------------------------
+ Success:                      
+ Success:                      
+(2 rows)
+-- Segment 0 is in vacuuming indexes phase (part of ao pre_cleanup phase), index_vacuum_count should increase to 1.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 0;
  relname                | phase             | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ------------------------+-------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | vacuuming indexes | 83              | 0                 | 0                  | 1                  | 50000           | 0               
+ vacuum_progress_ao_row | vacuuming indexes | 28              | 0                 | 0                  | 1                  | 16737           | 0               
 (1 row)
+-- Segment 1 and 2 are in truncate segments phase (part of ao post_cleanup phase), heap_blks_vacuumed should increase to 1.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id > 0;
+ relname                | phase                        | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized pre-cleanup | 28              | 0                 | 19                 | 2                  | 16558           | 0               
+ vacuum_progress_ao_row | append-optimized pre-cleanup | 28              | 0                 | 19                 | 2                  | 16705           | 0               
+(2 rows)
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+ relname                | phase                        | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+------------------------+------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+ vacuum_progress_ao_row | append-optimized pre-cleanup | 56              | 0                 | 38                 | 4                  | 33263           | 0               
+ vacuum_progress_ao_row | vacuuming indexes            | 28              | 0                 | 0                  | 1                  | 16737           | 0               
+(2 rows)
 
--- Resume execution and moving on to truncate segments that were marked as AWAITING_DROP, there should be only 1.
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
-(1 row)
-SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
- gp_inject_fault 
------------------
  Success:        
-(1 row)
-SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
- gp_wait_until_triggered_fault 
--------------------------------
- Success:                      
-(1 row)
--- We are in post_cleanup phase and should have truncated the old segfile. Both indexes should be vacuumed by now, and heap_blks_vacuumed should also increased
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
- relname                | phase                        | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
-------------------------+------------------------------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
- vacuum_progress_ao_row | append-optimized pre-cleanup | 83              | 0                 | 55                 | 2                  | 50000           | 0               
-(1 row)
-
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+ Success:        
+(3 rows)
+SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'reset', dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
  gp_inject_fault 
 -----------------
  Success:        
@@ -230,25 +276,34 @@ SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid)
 1<:  <... completed>
 VACUUM
 
--- Vacuum has finished, nothing should show up in the progress view.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+-- Vacuum has finished, nothing should show up in the view.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+ relname | phase | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
+---------+-------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
+(0 rows)
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
  relname | phase | heap_blks_total | heap_blks_scanned | heap_blks_vacuumed | index_vacuum_count | max_dead_tuples | num_dead_tuples 
 ---------+-------+-----------------+-------------------+--------------------+--------------------+-----------------+-----------------
 (0 rows)
 
 -- pg_class and collected stats view should be updated after the 2nd VACUUM
-1U: SELECT wait_until_dead_tup_change_to('vacuum_progress_ao_row'::regclass::oid, 0);
- wait_until_dead_tup_change_to 
--------------------------------
- OK                            
+1U: SELECT wait_until_vacuum_count_change_to('vacuum_progress_ao_row'::regclass::oid, 2);
+ wait_until_vacuum_count_change_to 
+-----------------------------------
+ OK                                
 (1 row)
 SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_progress_ao_row';
  relpages | reltuples | relallvisible 
 ----------+-----------+---------------
- 28       | 50000     | 0             
+ 30       | 50000     | 0             
 (1 row)
 SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
  n_live_tup | n_dead_tup | has_last_vacuum | vacuum_count 
+------------+------------+-----------------+--------------
+ 16705      | 0          | t               | 2            
+(1 row)
+SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM gp_stat_all_tables_summary WHERE relname = 'vacuum_progress_ao_row';
+ n_live_tup | n_dead_tup | has_last_vacuum | vacuum_count 
 ------------+------------+-----------------+--------------
  50000      | 0          | t               | 2            
 (1 row)
diff --git a/src/test/isolation2/input/hot_standby/query_conflict.source b/src/test/isolation2/input/hot_standby/query_conflict.source
index 0e2706bfa5a..5f2aee3be53 100644
--- a/src/test/isolation2/input/hot_standby/query_conflict.source
+++ b/src/test/isolation2/input/hot_standby/query_conflict.source
@@ -126,8 +126,8 @@ select gp_inject_fault('after_open_temp_file', 'reset',dbid) from gp_segment_con
 -1S<:
 -1Sq:
 
--- conflict has been recorded
--1S: select max(confl_tablespace) from gp_stat_database_conflicts where datname = 'isolation2-hot-standby';
+-- conflict has been recorded. The query has multiple slices
+-1S: select max(confl_tablespace) >= 1 from gp_stat_database_conflicts where datname = 'isolation2-hot-standby';
 
 -- cleanup
 !\retcode rm -rf @testtablespace@/hs_tablespace_directory;
diff --git a/src/test/isolation2/isolation2_schedule b/src/test/isolation2/isolation2_schedule
index c4318923c1f..d9d33ad76e4 100644
--- a/src/test/isolation2/isolation2_schedule
+++ b/src/test/isolation2/isolation2_schedule
@@ -152,7 +152,6 @@ test: uao/fast_analyze_row
 
 test: uao/create_index_allows_readonly_row
 test: reorganize_after_ao_vacuum_skip_drop truncate_after_ao_vacuum_skip_drop mark_all_aoseg_await_drop
-test: copy_to_concurrent_reorganize
 # below test(s) inject faults so each of them need to be in a separate group
 test: segwalrep/master_wal_switch
 
@@ -237,6 +236,7 @@ test: idle_gang_cleaner
 # test idle_in_transaction_session_timeout
 
 test: ao_index_build_progress
+test: analyze_progress
 
 # Tests for FTS
 test: fts_errors
diff --git a/src/test/isolation2/output/hot_standby/query_conflict.source b/src/test/isolation2/output/hot_standby/query_conflict.source
index 397e3977d12..909d2532df3 100644
--- a/src/test/isolation2/output/hot_standby/query_conflict.source
+++ b/src/test/isolation2/output/hot_standby/query_conflict.source
@@ -269,11 +269,11 @@ ERROR:  canceling statement due to conflict with recovery  (seg1 slice3 127.0.1.
 DETAIL:  User was or might have been using tablespace that must be dropped.
 -1Sq: ... <quitting>
 
--- conflict has been recorded
--1S: select max(confl_tablespace) from gp_stat_database_conflicts where datname = 'isolation2-hot-standby';
- max 
------
- 1   
+-- conflict has been recorded. The query has multiple slices
+-1S: select max(confl_tablespace) >= 1 from gp_stat_database_conflicts where datname = 'isolation2-hot-standby';
+ ?column? 
+----------
+ t        
 (1 row)
 
 -- cleanup
diff --git a/src/test/isolation2/sql/analyze_progress.sql b/src/test/isolation2/sql/analyze_progress.sql
new file mode 100644
index 00000000000..311ab161eb2
--- /dev/null
+++ b/src/test/isolation2/sql/analyze_progress.sql
@@ -0,0 +1,42 @@
+-- Test gp_stat_progress_analyze_summary
+-- setup hash distributed table
+CREATE TABLE t_analyze_part (a INT, b INT) DISTRIBUTED BY (a);
+INSERT INTO t_analyze_part SELECT i, i FROM generate_series(1, 100000) i;
+
+-- Suspend analyze after scanning 20 blocks on each segment
+SELECT gp_inject_fault('analyze_block', 'suspend', '', '', '', 20, 20, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+
+-- session 1: analyze the table
+1&: ANALYZE t_analyze_part;
+SELECT gp_wait_until_triggered_fault('analyze_block', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+
+-- session 2: query pg_stat_progress_analyze while the analyze is running, the view should indicate 60 blocks have been scanned as aggregated progress of 3 segments
+2: SELECT pid IS NOT NULL as has_pid, datname, relid::regclass, phase, sample_blks_total, sample_blks_scanned FROM gp_stat_progress_analyze_summary;
+
+-- Reset fault injector
+SELECT gp_inject_fault('analyze_block', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+1<:
+
+-- teardown
+DROP TABLE t_analyze_part;
+
+-- setup replicated table
+CREATE TABLE t_analyze_repl (a INT, b INT) DISTRIBUTED REPLICATED;
+INSERT INTO t_analyze_repl SELECT i, i FROM generate_series(1, 100000) i;
+
+-- Suspend analyze after scanning 20 blocks on each segment
+SELECT gp_inject_fault('analyze_block', 'suspend', '', '', '', 20, 20, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+
+-- session 1: analyze the table
+1&: ANALYZE t_analyze_repl;
+SELECT gp_wait_until_triggered_fault('analyze_block', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+
+-- session 2: query pg_stat_progress_analyze while the analyze is running, the view should indicate 20 blocks have been scanned as average progress of 3 segments
+2: SELECT pid IS NOT NULL as has_pid, datname, relid::regclass, phase, sample_blks_total, sample_blks_scanned FROM gp_stat_progress_analyze_summary;
+
+-- Reset fault injector
+SELECT gp_inject_fault('analyze_block', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+1<:
+
+-- teardown
+DROP TABLE t_analyze_repl;
diff --git a/src/test/isolation2/sql/ao_index_build_progress.sql b/src/test/isolation2/sql/ao_index_build_progress.sql
index 19aade99e29..c5e34d1eab7 100644
--- a/src/test/isolation2/sql/ao_index_build_progress.sql
+++ b/src/test/isolation2/sql/ao_index_build_progress.sql
@@ -7,30 +7,34 @@ CREATE TABLE ao_index_build_progress(i int, j bigint) USING ao_row
 
 -- Insert all tuples to seg1.
 INSERT INTO ao_index_build_progress SELECT 0, i FROM generate_series(1, 100000) i;
+INSERT INTO ao_index_build_progress SELECT 2, i FROM generate_series(1, 100000) i;
+INSERT INTO ao_index_build_progress SELECT 5, i FROM generate_series(1, 100000) i;
 
 -- Suspend execution when some blocks have been read.
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 10, 10, 0, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1&: CREATE INDEX ON ao_index_build_progress(i);
 
 -- Wait until some AO varblocks have been read.
 SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 10, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the relation's on-disk size.
-1U: SELECT command, phase,
+SELECT command, phase,
         (pg_relation_size('ao_index_build_progress') +
          (current_setting('block_size')::int - 1)) / current_setting('block_size')::int
         AS blocks_total_actual,
         blocks_total AS blocks_total_reported,
         blocks_done AS blocks_done_reported
-    FROM pg_stat_progress_create_index
-    WHERE relid = 'ao_index_build_progress'::regclass;
+    FROM gp_stat_progress_create_index
+    WHERE gp_segment_id = 1 AND relid = 'ao_index_build_progress'::regclass;
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'ao_index_build_progress'::regclass;
 
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1<:
 
@@ -40,31 +44,35 @@ CREATE TABLE aoco_index_build_progress(i int, j int ENCODING (compresstype=zstd,
 
 -- Insert all tuples to seg1.
 INSERT INTO aoco_index_build_progress SELECT 0, i FROM generate_series(1, 100000) i;
+INSERT INTO aoco_index_build_progress SELECT 2, i FROM generate_series(1, 100000) i;
+INSERT INTO aoco_index_build_progress SELECT 5, i FROM generate_series(1, 100000) i;
 
 -- Suspend execution when some blocks have been read.
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1&: CREATE INDEX ON aoco_index_build_progress(i);
 
 -- Wait until some AOCO varblocks have been read.
 SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the relation's on-disk size.
 -- Note: all blocks for the relation have to be scanned as we are building an
 -- index for the first time and a block directory has to be created.
-1U: SELECT command, phase,
+SELECT command, phase,
            (pg_relation_size('aoco_index_build_progress') +
             (current_setting('block_size')::int - 1)) / current_setting('block_size')::int AS blocks_total_actual,
             blocks_total AS blocks_total_reported,
            blocks_done AS blocks_done_reported
-    FROM pg_stat_progress_create_index
-    WHERE relid = 'aoco_index_build_progress'::regclass;
+    FROM gp_stat_progress_create_index
+    WHERE gp_segment_id = 1 AND relid = 'aoco_index_build_progress'::regclass;
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'aoco_index_build_progress'::regclass;
 
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1<:
 
@@ -72,13 +80,13 @@ SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', d
 
 -- Suspend execution when some blocks have been read.
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'suspend', '', '', '', 5, 5, 0, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1&: CREATE INDEX ON aoco_index_build_progress(j);
 
 -- Wait until some AOCO varblocks have been read.
 SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_success', 5, dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 -- By now, we should have reported some blocks (of size 'block_size') as "done",
 -- as well as a total number of blocks that matches the size of col j's segfile.
@@ -90,10 +98,12 @@ SELECT gp_wait_until_triggered_fault('AppendOnlyStorageRead_ReadNextBlock_succes
                 AS col_j_blocks,
            blocks_total AS blocks_total_reported,
            blocks_done AS blocks_done_reported
-    FROM pg_stat_progress_create_index
-    WHERE relid = 'aoco_index_build_progress'::regclass;
+    FROM gp_stat_progress_create_index
+    WHERE gp_segment_id = 1 AND relid = 'aoco_index_build_progress'::regclass;
+-- The same should be true for the summary view, and the total number of blocks should be tripled.
+SELECT command, phase, blocks_total, blocks_done FROM gp_stat_progress_create_index_summary WHERE relid = 'aoco_index_build_progress'::regclass;
 
 SELECT gp_inject_fault('AppendOnlyStorageRead_ReadNextBlock_success', 'reset', dbid)
-    FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+    FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1<:
diff --git a/src/test/isolation2/sql/copy_to_concurrent_reorganize.sql b/src/test/isolation2/sql/copy_to_concurrent_reorganize.sql
deleted file mode 100644
index 3473193d142..00000000000
--- a/src/test/isolation2/sql/copy_to_concurrent_reorganize.sql
+++ /dev/null
@@ -1,561 +0,0 @@
--- Test: COPY TO concurrent with ALTER TABLE SET WITH (reorganize=true)
--- Issue: https://github.com/apache/cloudberry/issues/1545
---
--- Tests 2.1: Core fix (relation-based COPY TO)
--- Tests 2.2-2.5: Extended fixes for query-based, partitioned, RLS, and CTAS paths
-
--- ============================================================
--- Test 2.1: relation-based COPY TO + concurrent reorganize
--- Reproduces issue #1545: COPY TO should return correct row count
--- after waiting for reorganize to release AccessExclusiveLock.
--- ============================================================
-
-CREATE TABLE copy_reorg_test (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO copy_reorg_test SELECT i, i FROM generate_series(1, 1000) i;
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_test;
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-1: ALTER TABLE copy_reorg_test SET WITH (reorganize=true);
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
--- At this point PortalRunUtility has already acquired a snapshot (before reorganize commits),
--- then DoCopy tries to acquire the lock and blocks.
-2&: COPY copy_reorg_test TO '/tmp/copy_reorg_test.csv';
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_reorg_test%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_reorg_verify FROM '/tmp/copy_reorg_test.csv';
-SELECT count(*) FROM copy_reorg_verify;
-
--- Cleanup
-DROP TABLE copy_reorg_verify;
-DROP TABLE copy_reorg_test;
-
--- ============================================================
--- Test 2.2: query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after pg_analyze_and_rewrite()
--- acquires all relation locks via AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_test (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO copy_query_reorg_test SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_query_reorg_test;
-
--- Session 1: reorganize holds AccessExclusiveLock
-1: BEGIN;
-1: ALTER TABLE copy_query_reorg_test SET WITH (reorganize=true);
-
--- Session 2: query-based COPY TO blocks (lock acquired in pg_analyze_and_rewrite -> AcquireRewriteLocks)
-2&: COPY (SELECT * FROM copy_query_reorg_test) TO '/tmp/copy_query_reorg_test.csv';
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY (SELECT%copy_query_reorg_test%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit
-1: COMMIT;
-
--- Session 2: Complete
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_query_reorg_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_query_reorg_verify FROM '/tmp/copy_query_reorg_test.csv';
-SELECT count(*) FROM copy_query_reorg_verify;
-
--- Cleanup
-DROP TABLE copy_query_reorg_verify;
-DROP TABLE copy_query_reorg_test;
-
--- ============================================================
--- Test 2.3: partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to eagerly lock all child
--- partitions before refreshing the snapshot, ensuring the snapshot sees all
--- child reorganize commits before the query is built.
--- ============================================================
-
-CREATE TABLE copy_part_parent (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE TABLE copy_part_child1 PARTITION OF copy_part_parent FOR VALUES FROM (1) TO (501);
-CREATE TABLE copy_part_child2 PARTITION OF copy_part_parent FOR VALUES FROM (501) TO (1001);
-INSERT INTO copy_part_parent SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_part_parent;
-
--- Session 1: reorganize the child partition
-1: BEGIN;
-1: ALTER TABLE copy_part_child1 SET WITH (reorganize=true);
-
--- Session 2: COPY parent TO (internally converted to query-based, child lock acquired in analyze phase)
-2&: COPY copy_part_parent TO '/tmp/copy_part_parent.csv';
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_part_parent%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit
-1: COMMIT;
-
--- Session 2: Complete
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_part_verify (a INT, b INT) DISTRIBUTED BY (a);
-COPY copy_part_verify FROM '/tmp/copy_part_parent.csv';
-SELECT count(*) FROM copy_part_verify;
-
--- Cleanup
-DROP TABLE copy_part_verify;
-DROP TABLE copy_part_parent;
-
--- ============================================================
--- Test 2.4: RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.2 — BeginCopy() refreshes snapshot after AcquireRewriteLocks()
--- which also acquires the lock on the RLS policy's lookup table.
--- ============================================================
-
-CREATE TABLE copy_rls_lookup (cat INT) DISTRIBUTED BY (cat);
-INSERT INTO copy_rls_lookup SELECT i FROM generate_series(1, 2) i;
-
-CREATE TABLE copy_rls_main (a INT, category INT) DISTRIBUTED BY (a);
-INSERT INTO copy_rls_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-
-ALTER TABLE copy_rls_main ENABLE ROW LEVEL SECURITY;
-CREATE POLICY p_rls ON copy_rls_main USING (category IN (SELECT cat FROM copy_rls_lookup));
-
--- Create non-superuser to trigger RLS (needs pg_write_server_files to COPY TO file)
-CREATE ROLE copy_rls_testuser;
-GRANT pg_write_server_files TO copy_rls_testuser;
-GRANT ALL ON copy_rls_main TO copy_rls_testuser;
-GRANT ALL ON copy_rls_lookup TO copy_rls_testuser;
-
-SELECT count(*) FROM copy_rls_main;
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_testuser; COPY copy_rls_main TO '/tmp/copy_rls_main.csv';
-
--- Session 1: reorganize the lookup table
-1: BEGIN;
-1: ALTER TABLE copy_rls_lookup SET WITH (reorganize=true);
-
--- Session 2: COPY TO as non-superuser (RLS active, internally converted to query-based)
-2&: SET ROLE copy_rls_testuser; COPY copy_rls_main TO '/tmp/copy_rls_main.csv';
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE '%COPY copy_rls_main%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit
-1: COMMIT;
-
--- Session 2: Complete
-2<:
-
--- Reset session 2's role to avoid leaking to subsequent tests
-2: RESET ROLE;
-
--- Verify: should match baseline count (400 rows filtered by RLS)
-RESET ROLE;
-CREATE TABLE copy_rls_verify (a INT, category INT) DISTRIBUTED BY (a);
-COPY copy_rls_verify FROM '/tmp/copy_rls_main.csv';
-SELECT count(*) FROM copy_rls_verify;
-
--- Cleanup
-DROP TABLE copy_rls_verify;
-DROP POLICY p_rls ON copy_rls_main;
-DROP TABLE copy_rls_main;
-DROP TABLE copy_rls_lookup;
-DROP ROLE copy_rls_testuser;
-
--- ============================================================
--- Test 2.5: CTAS + concurrent reorganize
--- Fixed as a side effect: CTAS goes through pg_analyze_and_rewrite() +
--- AcquireRewriteLocks(), so the snapshot refresh in BeginCopy() also fixes it.
--- ============================================================
-
-CREATE TABLE ctas_reorg_src (a INT, b INT) DISTRIBUTED BY (a);
-INSERT INTO ctas_reorg_src SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM ctas_reorg_src;
-
--- Session 1: reorganize
-1: BEGIN;
-1: ALTER TABLE ctas_reorg_src SET WITH (reorganize=true);
-
--- Session 2: CTAS should block (lock acquired in executor or analyze phase)
-2&: CREATE TABLE ctas_reorg_dst AS SELECT * FROM ctas_reorg_src DISTRIBUTED BY (a);
-
--- Confirm Session 2 is blocked
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'CREATE TABLE ctas_reorg_dst%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit
-1: COMMIT;
-
--- Session 2: Complete
-2<:
-
--- Verify row count after CTAS completes
-SELECT count(*) FROM ctas_reorg_dst;
-
--- Cleanup
-DROP TABLE ctas_reorg_dst;
-DROP TABLE ctas_reorg_src;
-
--- NOTE: Test 2.6 (change distribution key + query-based COPY TO) removed because
--- ALTER TABLE SET DISTRIBUTED BY + concurrent query-based COPY TO causes a server
--- crash (pre-existing Cloudberry bug, not related to this fix).
-
--- ============================================================
--- Test 2.1a: AO row table — relation-based COPY TO + concurrent reorganize
--- Same as 2.1 but using append-optimized row-oriented table.
--- ============================================================
-
-CREATE TABLE copy_reorg_ao_row_test (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-INSERT INTO copy_reorg_ao_row_test SELECT i, i FROM generate_series(1, 1000) i;
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_ao_row_test;
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-1: ALTER TABLE copy_reorg_ao_row_test SET WITH (reorganize=true);
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_ao_row_test TO '/tmp/copy_reorg_ao_row_test.csv';
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_reorg_ao_row_test%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-COPY copy_reorg_ao_row_verify FROM '/tmp/copy_reorg_ao_row_test.csv';
-SELECT count(*) FROM copy_reorg_ao_row_verify;
-
--- Cleanup
-DROP TABLE copy_reorg_ao_row_verify;
-DROP TABLE copy_reorg_ao_row_test;
-
--- ============================================================
--- Test 2.1b: AO column table — relation-based COPY TO + concurrent reorganize
--- Same as 2.1 but using append-optimized column-oriented table.
--- ============================================================
-
-CREATE TABLE copy_reorg_ao_col_test (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-INSERT INTO copy_reorg_ao_col_test SELECT i, i FROM generate_series(1, 1000) i;
-
--- Record original row count
-SELECT count(*) FROM copy_reorg_ao_col_test;
-
--- Session 1: Begin reorganize (holds AccessExclusiveLock)
-1: BEGIN;
-1: ALTER TABLE copy_reorg_ao_col_test SET WITH (reorganize=true);
-
--- Session 2: relation-based COPY TO should block on AccessShareLock
-2&: COPY copy_reorg_ao_col_test TO '/tmp/copy_reorg_ao_col_test.csv';
-
--- Confirm Session 2 is waiting for the lock
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_reorg_ao_col_test%' AND wait_event_type = 'Lock';
-
--- Session 1: Commit reorganize, releasing AccessExclusiveLock
-1: COMMIT;
-
--- Session 2: Should return 1000 rows (fixed), not 0 rows (broken)
-2<:
-
--- Verify the output file contains all rows
-CREATE TABLE copy_reorg_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-COPY copy_reorg_ao_col_verify FROM '/tmp/copy_reorg_ao_col_test.csv';
-SELECT count(*) FROM copy_reorg_ao_col_verify;
-
--- Cleanup
-DROP TABLE copy_reorg_ao_col_verify;
-DROP TABLE copy_reorg_ao_col_test;
-
--- ============================================================
--- Test 2.2a: AO row — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_ao_row_test (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-INSERT INTO copy_query_reorg_ao_row_test SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_query_reorg_ao_row_test;
-
-1: BEGIN;
-1: ALTER TABLE copy_query_reorg_ao_row_test SET WITH (reorganize=true);
-
-2&: COPY (SELECT * FROM copy_query_reorg_ao_row_test) TO '/tmp/copy_query_reorg_ao_row_test.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY (SELECT%copy_query_reorg_ao_row_test%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_query_reorg_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-COPY copy_query_reorg_ao_row_verify FROM '/tmp/copy_query_reorg_ao_row_test.csv';
-SELECT count(*) FROM copy_query_reorg_ao_row_verify;
-
-DROP TABLE copy_query_reorg_ao_row_verify;
-DROP TABLE copy_query_reorg_ao_row_test;
-
--- ============================================================
--- Test 2.2b: AO column — query-based COPY TO + concurrent reorganize
--- Fixed: BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_query_reorg_ao_col_test (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-INSERT INTO copy_query_reorg_ao_col_test SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_query_reorg_ao_col_test;
-
-1: BEGIN;
-1: ALTER TABLE copy_query_reorg_ao_col_test SET WITH (reorganize=true);
-
-2&: COPY (SELECT * FROM copy_query_reorg_ao_col_test) TO '/tmp/copy_query_reorg_ao_col_test.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY (SELECT%copy_query_reorg_ao_col_test%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_query_reorg_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-COPY copy_query_reorg_ao_col_verify FROM '/tmp/copy_query_reorg_ao_col_test.csv';
-SELECT count(*) FROM copy_query_reorg_ao_col_verify;
-
-DROP TABLE copy_query_reorg_ao_col_verify;
-DROP TABLE copy_query_reorg_ao_col_test;
-
--- ============================================================
--- Test 2.3a: AO row — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_ao_row (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE TABLE copy_part_child1_ao_row PARTITION OF copy_part_parent_ao_row FOR VALUES FROM (1) TO (501) USING ao_row;
-CREATE TABLE copy_part_child2_ao_row PARTITION OF copy_part_parent_ao_row FOR VALUES FROM (501) TO (1001) USING ao_row;
-INSERT INTO copy_part_parent_ao_row SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_part_parent_ao_row;
-
-1: BEGIN;
-1: ALTER TABLE copy_part_child1_ao_row SET WITH (reorganize=true);
-
-2&: COPY copy_part_parent_ao_row TO '/tmp/copy_part_parent_ao_row.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_part_parent_ao_row%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_part_ao_row_verify (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-COPY copy_part_ao_row_verify FROM '/tmp/copy_part_parent_ao_row.csv';
-SELECT count(*) FROM copy_part_ao_row_verify;
-
-DROP TABLE copy_part_ao_row_verify;
-DROP TABLE copy_part_parent_ao_row;
-
--- ============================================================
--- Test 2.3b: AO column — partitioned table COPY TO + child partition concurrent reorganize
--- Fixed: DoCopy() calls find_all_inheritors() to lock all child partitions first.
--- ============================================================
-
-CREATE TABLE copy_part_parent_ao_col (a INT, b INT) PARTITION BY RANGE (a) DISTRIBUTED BY (a);
-CREATE TABLE copy_part_child1_ao_col PARTITION OF copy_part_parent_ao_col FOR VALUES FROM (1) TO (501) USING ao_column;
-CREATE TABLE copy_part_child2_ao_col PARTITION OF copy_part_parent_ao_col FOR VALUES FROM (501) TO (1001) USING ao_column;
-INSERT INTO copy_part_parent_ao_col SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM copy_part_parent_ao_col;
-
-1: BEGIN;
-1: ALTER TABLE copy_part_child1_ao_col SET WITH (reorganize=true);
-
-2&: COPY copy_part_parent_ao_col TO '/tmp/copy_part_parent_ao_col.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'COPY copy_part_parent_ao_col%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-CREATE TABLE copy_part_ao_col_verify (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-COPY copy_part_ao_col_verify FROM '/tmp/copy_part_parent_ao_col.csv';
-SELECT count(*) FROM copy_part_ao_col_verify;
-
-DROP TABLE copy_part_ao_col_verify;
-DROP TABLE copy_part_parent_ao_col;
-
--- ============================================================
--- Test 2.4a: AO row — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.4 — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_ao_row_lookup (cat INT) USING ao_row DISTRIBUTED BY (cat);
-INSERT INTO copy_rls_ao_row_lookup SELECT i FROM generate_series(1, 2) i;
-
-CREATE TABLE copy_rls_ao_row_main (a INT, category INT) USING ao_row DISTRIBUTED BY (a);
-INSERT INTO copy_rls_ao_row_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-
-ALTER TABLE copy_rls_ao_row_main ENABLE ROW LEVEL SECURITY;
-CREATE POLICY p_rls_ao_row ON copy_rls_ao_row_main USING (category IN (SELECT cat FROM copy_rls_ao_row_lookup));
-
-CREATE ROLE copy_rls_ao_row_testuser;
-GRANT pg_write_server_files TO copy_rls_ao_row_testuser;
-GRANT ALL ON copy_rls_ao_row_main TO copy_rls_ao_row_testuser;
-GRANT ALL ON copy_rls_ao_row_lookup TO copy_rls_ao_row_testuser;
-
-SELECT count(*) FROM copy_rls_ao_row_main;
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_ao_row_testuser; COPY copy_rls_ao_row_main TO '/tmp/copy_rls_ao_row_main.csv';
-
-1: BEGIN;
-1: ALTER TABLE copy_rls_ao_row_lookup SET WITH (reorganize=true);
-
-2&: SET ROLE copy_rls_ao_row_testuser; COPY copy_rls_ao_row_main TO '/tmp/copy_rls_ao_row_main.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE '%COPY copy_rls_ao_row_main%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-2: RESET ROLE;
-
-RESET ROLE;
-CREATE TABLE copy_rls_ao_row_verify (a INT, category INT) USING ao_row DISTRIBUTED BY (a);
-COPY copy_rls_ao_row_verify FROM '/tmp/copy_rls_ao_row_main.csv';
-SELECT count(*) FROM copy_rls_ao_row_verify;
-
-DROP TABLE copy_rls_ao_row_verify;
-DROP POLICY p_rls_ao_row ON copy_rls_ao_row_main;
-DROP TABLE copy_rls_ao_row_main;
-DROP TABLE copy_rls_ao_row_lookup;
-DROP ROLE copy_rls_ao_row_testuser;
-
--- ============================================================
--- Test 2.4b: AO column — RLS table COPY TO + policy-referenced table concurrent reorganize
--- Fixed: same as 2.4 — BeginCopy() refreshes snapshot after AcquireRewriteLocks().
--- ============================================================
-
-CREATE TABLE copy_rls_ao_col_lookup (cat INT) USING ao_column DISTRIBUTED BY (cat);
-INSERT INTO copy_rls_ao_col_lookup SELECT i FROM generate_series(1, 2) i;
-
-CREATE TABLE copy_rls_ao_col_main (a INT, category INT) USING ao_column DISTRIBUTED BY (a);
-INSERT INTO copy_rls_ao_col_main SELECT i, (i % 5) + 1 FROM generate_series(1, 1000) i;
-
-ALTER TABLE copy_rls_ao_col_main ENABLE ROW LEVEL SECURITY;
-CREATE POLICY p_rls_ao_col ON copy_rls_ao_col_main USING (category IN (SELECT cat FROM copy_rls_ao_col_lookup));
-
-CREATE ROLE copy_rls_ao_col_testuser;
-GRANT pg_write_server_files TO copy_rls_ao_col_testuser;
-GRANT ALL ON copy_rls_ao_col_main TO copy_rls_ao_col_testuser;
-GRANT ALL ON copy_rls_ao_col_lookup TO copy_rls_ao_col_testuser;
-
-SELECT count(*) FROM copy_rls_ao_col_main;
-
--- Baseline: verify RLS filters correctly (should return 400 rows: categories 1 and 2 only)
-2: SET ROLE copy_rls_ao_col_testuser; COPY copy_rls_ao_col_main TO '/tmp/copy_rls_ao_col_main.csv';
-
-1: BEGIN;
-1: ALTER TABLE copy_rls_ao_col_lookup SET WITH (reorganize=true);
-
-2&: SET ROLE copy_rls_ao_col_testuser; COPY copy_rls_ao_col_main TO '/tmp/copy_rls_ao_col_main.csv';
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE '%COPY copy_rls_ao_col_main%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-2: RESET ROLE;
-
-RESET ROLE;
-CREATE TABLE copy_rls_ao_col_verify (a INT, category INT) USING ao_column DISTRIBUTED BY (a);
-COPY copy_rls_ao_col_verify FROM '/tmp/copy_rls_ao_col_main.csv';
-SELECT count(*) FROM copy_rls_ao_col_verify;
-
-DROP TABLE copy_rls_ao_col_verify;
-DROP POLICY p_rls_ao_col ON copy_rls_ao_col_main;
-DROP TABLE copy_rls_ao_col_main;
-DROP TABLE copy_rls_ao_col_lookup;
-DROP ROLE copy_rls_ao_col_testuser;
-
--- ============================================================
--- Test 2.5a: AO row — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_ao_row_src (a INT, b INT) USING ao_row DISTRIBUTED BY (a);
-INSERT INTO ctas_reorg_ao_row_src SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM ctas_reorg_ao_row_src;
-
-1: BEGIN;
-1: ALTER TABLE ctas_reorg_ao_row_src SET WITH (reorganize=true);
-
-2&: CREATE TABLE ctas_reorg_ao_row_dst AS SELECT * FROM ctas_reorg_ao_row_src DISTRIBUTED BY (a);
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'CREATE TABLE ctas_reorg_ao_row_dst%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-SELECT count(*) FROM ctas_reorg_ao_row_dst;
-
-DROP TABLE ctas_reorg_ao_row_dst;
-DROP TABLE ctas_reorg_ao_row_src;
-
--- ============================================================
--- Test 2.5b: AO column — CTAS + concurrent reorganize
--- Fixed as a side effect via BeginCopy() snapshot refresh.
--- ============================================================
-
-CREATE TABLE ctas_reorg_ao_col_src (a INT, b INT) USING ao_column DISTRIBUTED BY (a);
-INSERT INTO ctas_reorg_ao_col_src SELECT i, i FROM generate_series(1, 1000) i;
-
-SELECT count(*) FROM ctas_reorg_ao_col_src;
-
-1: BEGIN;
-1: ALTER TABLE ctas_reorg_ao_col_src SET WITH (reorganize=true);
-
-2&: CREATE TABLE ctas_reorg_ao_col_dst AS SELECT * FROM ctas_reorg_ao_col_src DISTRIBUTED BY (a);
-
-1: SELECT count(*) > 0 FROM pg_stat_activity
-   WHERE query LIKE 'CREATE TABLE ctas_reorg_ao_col_dst%' AND wait_event_type = 'Lock';
-
-1: COMMIT;
-2<:
-
-SELECT count(*) FROM ctas_reorg_ao_col_dst;
-
-DROP TABLE ctas_reorg_ao_col_dst;
-DROP TABLE ctas_reorg_ao_col_src;
-
--- NOTE: Tests 2.6a/2.6b (AO variants of change distribution key + query-based COPY TO)
--- removed for the same reason as test 2.6 (server crash, pre-existing bug).
diff --git a/src/test/isolation2/sql/resgroup/resgroup_bypass.sql b/src/test/isolation2/sql/resgroup/resgroup_bypass.sql
index 19c50771f75..01d9d60cbd0 100644
--- a/src/test/isolation2/sql/resgroup/resgroup_bypass.sql
+++ b/src/test/isolation2/sql/resgroup/resgroup_bypass.sql
@@ -133,6 +133,15 @@ SELECT gp_inject_fault('func_init_plan_end', 'reset', 1);
 1q:
 2q:
 
+-- verify the increment of num_executed in gp_toolkit.gp_resgroup_status
+1: SET ROLE role_bypass;
+1: SELECT num_executed INTO temporary temp_num1 FROM gp_toolkit.gp_resgroup_status WHERE groupname='rg_bypass';
+1: SELECT num_executed INTO temporary temp_num2 FROM gp_toolkit.gp_resgroup_status WHERE groupname='rg_bypass';
+1: SELECT temp_num2.num_executed - temp_num1.num_executed AS delta FROM temp_num1, temp_num2;
+1: DROP TABLE temp_num1;
+1: DROP TABLE temp_num2;
+1q:
+
 -- cleanup
 -- start_ignore
 DROP TABLE t_bypass;
diff --git a/src/test/isolation2/sql/setup.sql b/src/test/isolation2/sql/setup.sql
index 949f22f0002..6241413ba3b 100644
--- a/src/test/isolation2/sql/setup.sql
+++ b/src/test/isolation2/sql/setup.sql
@@ -461,6 +461,27 @@ begin
 end; /* in func */
 $$ language plpgsql;
 
+-- Helper function that waits for the stats collector to report the latest VACUUM: polls pg_stat_get_vacuum_count(relid) every 0.1s (clearing the stats snapshot between polls) and returns 'OK' once it equals stat_val_expected, or 'Fail' after 1200 polls.
+create or replace function wait_until_vacuum_count_change_to(relid oid, stat_val_expected bigint)
+    returns text as $$
+declare
+    stat_val bigint; /* in func */
+    i int; /* in func */
+begin
+    i := 0; /* in func */
+    while i < 1200 loop
+            select pg_stat_get_vacuum_count(relid) into stat_val; /* in func */
+            if stat_val = stat_val_expected then /* in func */
+                return 'OK'; /* in func */
+            end if; /* in func */
+            perform pg_sleep(0.1); /* in func */
+            perform pg_stat_clear_snapshot(); /* in func */
+            i := i + 1; /* in func */
+        end loop; /* in func */
+    return 'Fail'; /* in func */
+end; /* in func */
+$$ language plpgsql;
+
 -- Helper function to get the number of blocks in a relation.
 CREATE OR REPLACE FUNCTION nblocks(rel regclass) RETURNS int AS $$ /* in func */
 BEGIN /* in func */
diff --git a/src/test/isolation2/sql/vacuum_progress_row.sql b/src/test/isolation2/sql/vacuum_progress_row.sql
index 1ccf6ca090f..93da2a47bbc 100644
--- a/src/test/isolation2/sql/vacuum_progress_row.sql
+++ b/src/test/isolation2/sql/vacuum_progress_row.sql
@@ -11,16 +11,15 @@ CREATE TABLE vacuum_progress_ao_row(i int, j int);
 CREATE INDEX on vacuum_progress_ao_row(i);
 CREATE INDEX on vacuum_progress_ao_row(j);
 
--- Insert all tuples to seg1 from two current sessions so that data are stored
--- in two segment files.
+-- Insert from two concurrent sessions so that data are stored in two segment files.
 1: BEGIN;
 2: BEGIN;
-1: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
-2: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
+1: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
+2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
 -- Commit so that the logical EOF of segno 2 is non-zero.
 2: COMMIT;
 2: BEGIN;
-2: INSERT INTO vacuum_progress_ao_row SELECT 0, i FROM generate_series(1, 100000) i;
+2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
 -- Abort so that segno 2 has dead tuples after its logical EOF
 2: ABORT;
 2q:
@@ -32,40 +31,46 @@ DELETE FROM vacuum_progress_ao_row where j % 2 = 0;
 
 -- Lookup pg_class and collected stats view before VACUUM
 SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_progress_ao_row';
-SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
+SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM gp_stat_all_tables WHERE relname = 'vacuum_progress_ao_row' and gp_segment_id = 1;
+SELECT n_live_tup, n_dead_tup, last_vacuum, vacuum_count FROM gp_stat_all_tables_summary WHERE relname = 'vacuum_progress_ao_row';
 
 -- Perform VACUUM and observe the progress
 
 -- Suspend execution at pre-cleanup phase after truncating both segfiles to their logical EOF.
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', '', '', '', 2, 2, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', '', '', '', 2, 2, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 
 1: set Debug_appendonly_print_compaction to on;
 1&: VACUUM vacuum_progress_ao_row;
 SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 2, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
 -- We are in pre_cleanup phase and some blocks should've been vacuumed by now
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
 
 -- Resume execution and suspend again in the middle of compact phase
-SELECT gp_inject_fault('appendonly_insert', 'suspend', '', '', '', 200, 200, 0, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_insert', 'suspend', '', '', '', 200, 200, 0, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 SELECT gp_wait_until_triggered_fault('appendonly_insert', 200, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
 -- We are in compact phase. num_dead_tuples should increase as we move and count tuples, one by one.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
 
 -- Resume execution and suspend again after compacting all segfiles
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_inject_fault('appendonly_insert', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_compact', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+SELECT gp_inject_fault('appendonly_insert', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 SELECT gp_wait_until_triggered_fault('vacuum_ao_after_compact', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
 -- After compacting all segfiles we expect 50000 dead tuples
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
 
 -- Resume execution and entering post_cleaup phase, suspend at the end of it.
-SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 SELECT gp_wait_until_triggered_fault('vacuum_ao_post_cleanup_end', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
 -- We should have skipped recycling the awaiting drop segment because the segment was still visible to the SELECT gp_wait_until_triggered_fault query.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
-SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+
+SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
 1<:
 
 -- pg_class and collected stats view should be updated after the 1st VACUUM
@@ -74,113 +79,34 @@ SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_
 SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
 
 -- Perform VACUUM again to recycle the remaining awaiting drop segment marked by the previous run.
-SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', dbid) FROM gp_segment_configuration WHERE content > 0 AND role = 'p';
 1&: VACUUM vacuum_progress_ao_row;
--- Resume execution and entering pre_cleanup phase, suspend at vacuuming indexes.
-SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_wait_until_triggered_fault('vacuum_ao_after_index_delete', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
--- We are in vacuuming indexes phase (part of ao pre_cleanup phase), index_vacuum_count should increase to 1.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
-
--- Resume execution and moving on to truncate segments that were marked as AWAITING_DROP, there should be only 1.
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'suspend', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
-SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 1, dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
--- We are in post_cleanup phase and should have truncated the old segfile. Both indexes should be vacuumed by now, and heap_blks_vacuumed should also increased
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
-
-SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content = 1 AND role = 'p';
+-- Resume execution and entering pre_cleanup phase, suspend at vacuuming indexes for segment 0.
+SELECT gp_wait_until_triggered_fault('vacuum_ao_after_index_delete', 1, dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
+-- Resume execution and moving on to truncate segments that were marked as AWAITING_DROP for segment 1 and 2, there should be only 1.
+SELECT gp_wait_until_triggered_fault('appendonly_after_truncate_segment_file', 1, dbid) FROM gp_segment_configuration WHERE content > 0 AND role = 'p';
+-- Segment 0 is in vacuuming indexes phase (part of ao pre_cleanup phase), index_vacuum_count should increase to 1.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 0;
+-- Segment 1 and 2 are in truncate segments phase (part of ao post_cleanup phase), heap_blks_vacuumed should increase to 1.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id > 0;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
+
+SELECT gp_inject_fault('appendonly_after_truncate_segment_file', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
+SELECT gp_inject_fault('vacuum_ao_after_index_delete', 'reset', dbid) FROM gp_segment_configuration WHERE content = 0 AND role = 'p';
 1<:
 
--- Vacuum has finished, nothing should show up in the progress view.
-1U: select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from pg_stat_progress_vacuum;
+-- Vacuum has finished, nothing should show up in the view.
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id = 1;
+select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
 
 -- pg_class and collected stats view should be updated after the 2nd VACUUM
-1U: SELECT wait_until_dead_tup_change_to('vacuum_progress_ao_row'::regclass::oid, 0);
+1U: SELECT wait_until_vacuum_count_change_to('vacuum_progress_ao_row'::regclass::oid, 2);
 SELECT relpages, reltuples, relallvisible FROM pg_class where relname = 'vacuum_progress_ao_row';
-SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM pg_stat_all_tables WHERE relname = 'vacuum_progress_ao_row';
+SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM gp_stat_all_tables WHERE relname = 'vacuum_progress_ao_row' and gp_segment_id = 1;
+SELECT n_live_tup, n_dead_tup, last_vacuum is not null as has_last_vacuum, vacuum_count FROM gp_stat_all_tables_summary WHERE relname = 'vacuum_progress_ao_row';
 
--- open if system views gp_stat_progress_vacuum* are enabled
---1q:
----- Test vacuum worker process is changed at post-cleanup phase due to mirror down.
----- Current behavior is it will clear previous compact phase num_dead_tuples in post-cleanup
----- phase (at injecting point vacuum_ao_post_cleanup_end), which is different from above case
----- in which vacuum worker isn't changed.
---ALTER SYSTEM SET gp_fts_mark_mirror_down_grace_period to 10;
---ALTER SYSTEM SET gp_fts_probe_interval to 10;
---SELECT gp_segment_id, pg_reload_conf() FROM gp_id UNION SELECT gp_segment_id, pg_reload_conf() FROM gp_dist_random('gp_id');
---
---DROP TABLE IF EXISTS vacuum_progress_ao_row;
---CREATE TABLE vacuum_progress_ao_row(i int, j int);
---CREATE INDEX on vacuum_progress_ao_row(i);
---CREATE INDEX on vacuum_progress_ao_row(j);
---1: BEGIN;
---2: BEGIN;
---1: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
---2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
---2: COMMIT;
---2: BEGIN;
---2: INSERT INTO vacuum_progress_ao_row SELECT i, i FROM generate_series(1, 100000) i;
---2: ABORT;
---2q:
---1: ABORT;
---DELETE FROM vacuum_progress_ao_row where j % 2 = 0;
---
----- Suspend execution at the end of compact phase.
---2: SELECT gp_inject_fault('vacuum_ao_after_compact', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---
---1: set debug_appendonly_print_compaction to on;
---1&: vacuum vacuum_progress_ao_row;
---
---2: SELECT gp_wait_until_triggered_fault('vacuum_ao_after_compact', 3, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---
----- Non-zero progressing data num_dead_tuples is showed up.
---select gp_segment_id, relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id > -1;
---select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
---
----- Resume execution of compact phase and block at syncrep.
---2: SELECT gp_inject_fault_infinite('wal_sender_loop', 'suspend', dbid) FROM gp_segment_configuration WHERE role = 'p' and content = 1;
---2: SELECT gp_inject_fault('vacuum_ao_after_compact', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
----- stop the mirror should turn off syncrep
---2: SELECT pg_ctl(datadir, 'stop', 'immediate') FROM gp_segment_configuration WHERE content=1 AND role = 'm';
---
----- Resume walsender to detect mirror down and suspend at the beginning
----- of post-cleanup taken over by a new vacuum worker.
---2: SELECT gp_inject_fault('vacuum_worker_changed', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
----- resume walsender and let it exit so that mirror stop can be detected
---2: SELECT gp_inject_fault_infinite('wal_sender_loop', 'reset', dbid) FROM gp_segment_configuration WHERE role = 'p' and content = 1;
----- Ensure we enter into the target logic which stops cumulative data but
----- initializes a new vacrelstats at the beginning of post-cleanup phase.
----- Also all segments should reach to the same "vacuum_worker_changed" point
----- due to FTS version being changed.
---2: SELECT gp_wait_until_triggered_fault('vacuum_worker_changed', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
----- now seg1's mirror is marked as down
---2: SELECT content, role, preferred_role, mode, status FROM gp_segment_configuration WHERE content > -1;
---
----- Resume execution and entering post_cleaup phase, suspend at the end of it.
---2: SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'suspend', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---2: SELECT gp_inject_fault('vacuum_worker_changed', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---2: SELECT gp_wait_until_triggered_fault('vacuum_ao_post_cleanup_end', 1, dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---
----- The previous collected num_dead_tuples in compact phase is zero.
---select gp_segment_id, relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum where gp_segment_id > -1;
---select relid::regclass as relname, phase, heap_blks_total, heap_blks_scanned, heap_blks_vacuumed, index_vacuum_count, max_dead_tuples, num_dead_tuples from gp_stat_progress_vacuum_summary;
---
---2: SELECT gp_inject_fault('vacuum_ao_post_cleanup_end', 'reset', dbid) FROM gp_segment_configuration WHERE content > -1 AND role = 'p';
---
---1<:
---
----- restore environment
---1: reset debug_appendonly_print_compaction;
---
---2: SELECT pg_ctl_start(datadir, port) FROM gp_segment_configuration WHERE role = 'm' AND content = 1;
---2: SELECT wait_until_all_segments_synchronized();
---
----- Cleanup
---SELECT gp_inject_fault_infinite('all', 'reset', dbid) FROM gp_segment_configuration;
---reset Debug_appendonly_print_compaction;
---reset default_table_access_method;
---ALTER SYSTEM RESET gp_fts_mark_mirror_down_grace_period;
---ALTER SYSTEM RESET gp_fts_probe_interval;
---SELECT gp_segment_id, pg_reload_conf() FROM gp_id UNION SELECT gp_segment_id, pg_reload_conf() FROM gp_dist_random('gp_id');
---
\ No newline at end of file
+-- Cleanup
+SELECT gp_inject_fault_infinite('all', 'reset', dbid) FROM gp_segment_configuration;
+reset Debug_appendonly_print_compaction;
+reset default_table_access_method;
diff --git a/src/test/perl/PostgresNode.pm b/src/test/perl/PostgresNode.pm
index b9896d5076a..50ba9d041bc 100644
--- a/src/test/perl/PostgresNode.pm
+++ b/src/test/perl/PostgresNode.pm
@@ -708,7 +708,7 @@ sub adjust_conf
 
     my $conffile = $self->data_dir . '/' . $filename;
 
-    my $contents = PostgreSQL::Test::Utils::slurp_file($conffile);
+    my $contents = TestLib::slurp_file($conffile);
     my @lines    = split(/\n/, $contents);
     my @result;
     my $eq = $skip_equals ? '' : '= ';
@@ -1296,7 +1296,7 @@ sub enable_archiving
 	my $copy_command =
 	  $TestLib::windows_os
 	  ? qq{copy "%p" "$path\\\\%f"}
-	  : qq{cp "%p" "$path/%f"};
+	  : qq{install -m 644 "%p" "$path/%f"};
 
 	# Enable archive_mode and archive_command on node
 	$self->append_conf(
diff --git a/src/test/regress/GNUmakefile b/src/test/regress/GNUmakefile
index 9bc8b67591e..60f8d491efb 100644
--- a/src/test/regress/GNUmakefile
+++ b/src/test/regress/GNUmakefile
@@ -223,6 +223,12 @@ installcheck-cbdb-parallel: all tablespace-setup twophase_pqexecparams
 	$(pg_regress_installcheck) $(REGRESS_OPTS) --schedule=$(srcdir)/parallel_schedule --schedule=$(srcdir)/greenplum_schedule --max-connections=5 $(EXTRA_TESTS) --exclude-tests explain \
 	)
 
+installcheck-orca-parallel: all tablespace-setup twophase_pqexecparams
+	( \
+	export PGOPTIONS='-c optimizer=on -c enable_parallel=true -c min_parallel_table_scan_size=0 -c min_parallel_index_scan_size=0 -c parallel_setup_cost=0'; \
+	$(pg_regress_installcheck) $(REGRESS_OPTS) --exclude-file=$(srcdir)/excluded_tests.conf --schedule=$(srcdir)/parallel_schedule --schedule=$(srcdir)/greenplum_schedule --max-connections=4 --ignore-plans $(EXTRA_TESTS) \
+	)
+
 installcheck-tests: all
 	$(pg_regress_installcheck) $(REGRESS_OPTS) $(TESTS) $(EXTRA_TESTS)
 
diff --git a/src/test/regress/excluded_tests.conf b/src/test/regress/excluded_tests.conf
new file mode 100644
index 00000000000..e29197946d4
--- /dev/null
+++ b/src/test/regress/excluded_tests.conf
@@ -0,0 +1,14 @@
+brin_bloom
+join_hash
+explain
+memoize
+cte_prune
+tuplesort
+gporca
+brin_ao
+brin_aocs
+direct_dispatch
+bfv_dd
+bfv_dd_multicolumn
+planhints
+rowhints
diff --git a/src/test/regress/expected/.gitignore b/src/test/regress/expected/.gitignore
index c837ca324d5..f625061dbd6 100644
--- a/src/test/regress/expected/.gitignore
+++ b/src/test/regress/expected/.gitignore
@@ -70,3 +70,4 @@
 /ao_unique_index_partition.out
 /bfv_copy.out
 /copy_encoding_error.out
+/vacuum_fsm_nondefault_tablespace.out
diff --git a/src/test/regress/expected/analyze.out b/src/test/regress/expected/analyze.out
index 843a728c9b6..74169660301 100644
--- a/src/test/regress/expected/analyze.out
+++ b/src/test/regress/expected/analyze.out
@@ -1314,3 +1314,30 @@ select * from pg_stats where tablename like 'part2';
 (1 row)
 
 drop table multipart cascade;
+--
+-- Test column-specific ANALYZE correctly uses attnum-based NDV index (not loop index).
+-- When ANALYZE t(b) is run, the QD loop has i=0 for column b (attnum=2),
+-- so attnum-1=1 != i=0. Without the fix, colNDVBySeg[i=0] reads column a's NDV
+-- instead of column b's NDV.
+--
+CREATE TABLE analyze_col_ndv_drop (a int, b int, c int) DISTRIBUTED BY (a);
+INSERT INTO analyze_col_ndv_drop SELECT i%5, i, i%50 FROM generate_series(1, 100) i;
+-- ANALYZE specific column b: QD loop has i=0, b.attnum=2, so attnum-1=1 != i=0
+ANALYZE analyze_col_ndv_drop (b);
+-- stadistinctbyseg for b should be 100 (all distinct), not ~5 (NDV of column a at index 0)
+SELECT a.attname,
+       CASE WHEN s.stakind1 = 8 THEN array_to_string(s.stavalues1, ',')
+            WHEN s.stakind2 = 8 THEN array_to_string(s.stavalues2, ',')
+            WHEN s.stakind3 = 8 THEN array_to_string(s.stavalues3, ',')
+            WHEN s.stakind4 = 8 THEN array_to_string(s.stavalues4, ',')
+            WHEN s.stakind5 = 8 THEN array_to_string(s.stavalues5, ',')
+       END AS stadistinctbyseg
+FROM pg_statistic s
+JOIN pg_attribute a ON a.attrelid = s.starelid AND a.attnum = s.staattnum
+WHERE s.starelid = 'analyze_col_ndv_drop'::regclass AND a.attname = 'b';
+ attname | stadistinctbyseg 
+---------+------------------
+ b       | 100
+(1 row)
+
+DROP TABLE analyze_col_ndv_drop;
diff --git a/src/test/regress/expected/brin.out b/src/test/regress/expected/brin.out
index 20807f31997..2a0d670300a 100644
--- a/src/test/regress/expected/brin.out
+++ b/src/test/regress/expected/brin.out
@@ -323,6 +323,7 @@ BEGIN
 		SET enable_bitmapscan = 1;
 		SET optimizer_enable_tablescan = 0;
 		SET optimizer_enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		is_planner_plan := false;
diff --git a/src/test/regress/expected/brin_bloom.out b/src/test/regress/expected/brin_bloom.out
index 241847a2707..e636c9ba4ae 100644
--- a/src/test/regress/expected/brin_bloom.out
+++ b/src/test/regress/expected/brin_bloom.out
@@ -230,6 +230,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_bloom WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/expected/brin_bloom_optimizer.out b/src/test/regress/expected/brin_bloom_optimizer.out
index 65622f51b4b..2fb93d2819f 100644
--- a/src/test/regress/expected/brin_bloom_optimizer.out
+++ b/src/test/regress/expected/brin_bloom_optimizer.out
@@ -230,6 +230,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_bloom WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/expected/brin_multi.out b/src/test/regress/expected/brin_multi.out
index 0720a66b2ae..677fb45f1fd 100644
--- a/src/test/regress/expected/brin_multi.out
+++ b/src/test/regress/expected/brin_multi.out
@@ -260,6 +260,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_multi WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/expected/brin_multi_optimizer.out b/src/test/regress/expected/brin_multi_optimizer.out
index a31f69d9a16..91a0fa232cb 100644
--- a/src/test/regress/expected/brin_multi_optimizer.out
+++ b/src/test/regress/expected/brin_multi_optimizer.out
@@ -260,6 +260,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_multi WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/expected/brin_multi_optimizer_1.out b/src/test/regress/expected/brin_multi_optimizer_1.out
index 15e850fbca7..d56000ba8fb 100644
--- a/src/test/regress/expected/brin_multi_optimizer_1.out
+++ b/src/test/regress/expected/brin_multi_optimizer_1.out
@@ -260,6 +260,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_multi WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/expected/brin_optimizer.out b/src/test/regress/expected/brin_optimizer.out
index 37d3d21fb10..b749771b08e 100644
--- a/src/test/regress/expected/brin_optimizer.out
+++ b/src/test/regress/expected/brin_optimizer.out
@@ -323,6 +323,7 @@ BEGIN
 		SET enable_bitmapscan = 1;
 		SET optimizer_enable_tablescan = 0;
 		SET optimizer_enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		is_planner_plan := false;
diff --git a/src/test/regress/expected/cbdb_parallel.out b/src/test/regress/expected/cbdb_parallel.out
index 35e90eebfa1..af975de50f4 100644
--- a/src/test/regress/expected/cbdb_parallel.out
+++ b/src/test/regress/expected/cbdb_parallel.out
@@ -112,8 +112,8 @@ set local enable_parallel_dedup_semi_reverse_join = on;
 set local enable_parallel_dedup_semi_join = on;
 explain (costs off)
 select sum(foo.a) from foo where exists (select 1 from bar where foo.a = bar.b);
-                                           QUERY PLAN                                           
-------------------------------------------------------------------------------------------------
+                                          QUERY PLAN                                           
+-----------------------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 6:1  (slice1; segments: 6)
          ->  Partial Aggregate
@@ -1032,6 +1032,15 @@ explain(locus, costs off) select * from rt1 join t1 on rt1.a = t1.b join rt2 on
 select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
+  1 |  2 |  1 |  1 |  1 |  2
+  2 |  3 |  1 |  2 |  2 |  3
+  5 |  6 |  5 |  5 |  5 |  6
+  6 |  7 |  6 |  6 |  6 |  7
+  9 | 10 |  9 |  9 |  9 | 10
+ 10 | 11 | 10 | 10 | 10 | 11
+  6 |  7 |  5 |  6 |  6 |  7
+  7 |  8 |  6 |  7 |  7 |  8
+ 10 | 11 |  9 | 10 | 10 | 11
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  3 |  3 |  3 |  4
   4 |  5 |  4 |  4 |  4 |  5
@@ -1042,15 +1051,6 @@ select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
   5 |  6 |  4 |  5 |  5 |  6
   8 |  9 |  7 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
-  5 |  6 |  5 |  5 |  5 |  6
-  6 |  7 |  6 |  6 |  6 |  7
-  9 | 10 |  9 |  9 |  9 | 10
- 10 | 11 | 10 | 10 | 10 | 11
-  6 |  7 |  5 |  6 |  6 |  7
-  7 |  8 |  6 |  7 |  7 |  8
- 10 | 11 |  9 | 10 | 10 | 11
-  1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
 (19 rows)
 
 -- parallel hash join
@@ -1093,13 +1093,8 @@ explain(locus, costs off) select * from rt1 join t1 on rt1.a = t1.b join rt2 on
 select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
-  5 |  6 |  5 |  5 |  5 |  6
-  6 |  7 |  5 |  6 |  6 |  7
-  6 |  7 |  6 |  6 |  6 |  7
-  7 |  8 |  6 |  7 |  7 |  8
-  9 | 10 |  9 |  9 |  9 | 10
- 10 | 11 |  9 | 10 | 10 | 11
- 10 | 11 | 10 | 10 | 10 | 11
+  1 |  2 |  1 |  1 |  1 |  2
+  2 |  3 |  1 |  2 |  2 |  3
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  2 |  3 |  3 |  4
   3 |  4 |  3 |  3 |  3 |  4
@@ -1110,8 +1105,13 @@ select * from rt1 join t1 on rt1.a = t1.b join rt2 on rt2.a = t1.b;
   8 |  9 |  7 |  8 |  8 |  9
   8 |  9 |  8 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
-  1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
+  5 |  6 |  5 |  5 |  5 |  6
+  6 |  7 |  5 |  6 |  6 |  7
+  6 |  7 |  6 |  6 |  6 |  7
+  7 |  8 |  6 |  7 |  7 |  8
+  9 | 10 |  9 |  9 |  9 | 10
+ 10 | 11 |  9 | 10 | 10 | 11
+ 10 | 11 | 10 | 10 | 10 | 11
 (19 rows)
 
 --
@@ -1145,6 +1145,8 @@ explain(locus, costs off) select * from rt1 join t1 on rt1.a = t1.b join rt3 on
 select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
+  1 |  2 |  1 |  1 |  1 |  2
+  2 |  3 |  1 |  2 |  2 |  3
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  3 |  3 |  3 |  4
   4 |  5 |  4 |  4 |  4 |  5
@@ -1155,8 +1157,6 @@ select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
   5 |  6 |  4 |  5 |  5 |  6
   8 |  9 |  7 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
-  1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
   5 |  6 |  5 |  5 |  5 |  6
   6 |  7 |  6 |  6 |  6 |  7
   9 | 10 |  9 |  9 |  9 | 10
@@ -1201,14 +1201,11 @@ select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
  a  | b  | a  | b  | a  | b  
 ----+----+----+----+----+----
   1 |  2 |  1 |  1 |  1 |  2
-  2 |  3 |  1 |  2 |  2 |  3
   5 |  6 |  5 |  5 |  5 |  6
   6 |  7 |  6 |  6 |  6 |  7
   9 | 10 |  9 |  9 |  9 | 10
  10 | 11 | 10 | 10 | 10 | 11
-  6 |  7 |  5 |  6 |  6 |  7
-  7 |  8 |  6 |  7 |  7 |  8
- 10 | 11 |  9 | 10 | 10 | 11
+  2 |  3 |  1 |  2 |  2 |  3
   2 |  3 |  2 |  2 |  2 |  3
   3 |  4 |  3 |  3 |  3 |  4
   4 |  5 |  4 |  4 |  4 |  5
@@ -1219,6 +1216,9 @@ select * from rt1 join t1 on rt1.a = t1.b join rt3 on rt3.a = t1.b;
   5 |  6 |  4 |  5 |  5 |  6
   8 |  9 |  7 |  8 |  8 |  9
   9 | 10 |  8 |  9 |  9 | 10
+  6 |  7 |  5 |  6 |  6 |  7
+  7 |  8 |  6 |  7 |  7 |  8
+ 10 | 11 |  9 | 10 | 10 | 11
 (19 rows)
 
 create table t2(a int, b int) with(parallel_workers=0);
@@ -1271,12 +1271,12 @@ explain(locus, costs off) select * from rt4 join t2 using(b);
 select * from rt4 join t2 using(b);
  b  | a  | a  
 ----+----+----
-  2 |  1 |  1
   3 |  2 |  2
   4 |  3 |  3
   5 |  4 |  4
   8 |  7 |  7
   9 |  8 |  8
+  2 |  1 |  1
   6 |  5 |  5
   7 |  6 |  6
  10 |  9 |  9
@@ -1362,9 +1362,9 @@ explain(locus, costs off) select * from t_replica_workers_2 join t_random_worker
 select * from t_replica_workers_2 join t_random_workers_0 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
- 3 | 4 | 4
  1 | 2 | 2
+ 3 | 4 | 4
+ 2 | 3 | 3
  4 | 5 | 5
  5 | 6 | 6
 (5 rows)
@@ -1374,9 +1374,9 @@ set local enable_parallel=false;
 select * from t_replica_workers_2 join t_random_workers_0 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
- 3 | 4 | 4
  1 | 2 | 2
+ 3 | 4 | 4
+ 2 | 3 | 3
  4 | 5 | 5
  5 | 6 | 6
 (5 rows)
@@ -1419,9 +1419,9 @@ explain(locus, costs off) select * from t_replica_workers_2 right join t_random_
 select * from t_replica_workers_2 right join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
+ 2 | 3 | 3
  5 | 6 | 6
  1 | 2 | 2
- 2 | 3 | 3
  3 | 4 | 4
  4 | 5 | 5
 (5 rows)
@@ -1431,11 +1431,11 @@ set local enable_parallel=false;
 select * from t_replica_workers_2 right join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
+ 5 | 6 | 6
  1 | 2 | 2
- 2 | 3 | 3
  3 | 4 | 4
  4 | 5 | 5
- 5 | 6 | 6
+ 2 | 3 | 3
 (5 rows)
 
 abort;
@@ -1471,13 +1471,13 @@ explain(locus, costs off) select * from t_replica_workers_2 join t_random_worker
                      Locus: Strewn
                      Parallel Workers: 2
  Optimizer: Postgres query optimizer
-(16 rows)
+(15 rows)
 
 select * from t_replica_workers_2 join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
  1 | 2 | 2
+ 2 | 3 | 3
  3 | 4 | 4
  4 | 5 | 5
  5 | 6 | 6
@@ -1488,11 +1488,11 @@ set local enable_parallel=false;
 select * from t_replica_workers_2 join t_random_workers_2 using(a);
  a | b | b 
 ---+---+---
- 2 | 3 | 3
- 1 | 2 | 2
  3 | 4 | 4
  4 | 5 | 5
  5 | 6 | 6
+ 1 | 2 | 2
+ 2 | 3 | 3
 (5 rows)
 
 abort;
@@ -1510,28 +1510,28 @@ analyze t1;
 analyze rt1;
 set local enable_parallel = on;
 explain(locus, costs off) select * from (select count(*) as a from t1) t1 left join rt1  on rt1.a = t1.a;
-                      QUERY PLAN                      
-------------------------------------------------------
- Parallel Hash Left Join
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Parallel Hash Right Join
    Locus: Entry
-   Hash Cond: ((count(*)) = rt1.a)
-   ->  Finalize Aggregate
+   Hash Cond: (rt1.a = (count(*)))
+   ->  Gather Motion 2:1  (slice1; segments: 2)
          Locus: Entry
-         ->  Gather Motion 6:1  (slice1; segments: 6)
-               Locus: Entry
-               ->  Partial Aggregate
-                     Locus: HashedWorkers
-                     Parallel Workers: 2
-                     ->  Parallel Seq Scan on t1
-                           Locus: HashedWorkers
-                           Parallel Workers: 2
+         ->  Parallel Seq Scan on rt1
+               Locus: SegmentGeneralWorkers
+               Parallel Workers: 2
    ->  Parallel Hash
          Locus: Entry
-         ->  Gather Motion 2:1  (slice2; segments: 2)
+         ->  Finalize Aggregate
                Locus: Entry
-               ->  Parallel Seq Scan on rt1
-                     Locus: SegmentGeneralWorkers
-                     Parallel Workers: 2
+               ->  Gather Motion 6:1  (slice2; segments: 6)
+                     Locus: Entry
+                     ->  Partial Aggregate
+                           Locus: HashedWorkers
+                           Parallel Workers: 2
+                           ->  Parallel Seq Scan on t1
+                                 Locus: HashedWorkers
+                                 Parallel Workers: 2
  Optimizer: Postgres query optimizer
 (21 rows)
 
@@ -1661,17 +1661,17 @@ explain(costs off) select * from t1 right join t2 on t1.b = t2.a;
                             QUERY PLAN                            
 ------------------------------------------------------------------
  Gather Motion 9:1  (slice1; segments: 9)
-   ->  Parallel Hash Left Join
-         Hash Cond: (t2.a = t1.b)
-         ->  Redistribute Motion 6:9  (slice2; segments: 6)
-               Hash Key: t2.a
+   ->  Parallel Hash Right Join
+         Hash Cond: (t1.b = t2.a)
+         ->  Redistribute Motion 9:9  (slice2; segments: 9)
+               Hash Key: t1.b
                Hash Module: 3
-               ->  Parallel Seq Scan on t2
+               ->  Parallel Seq Scan on t1
          ->  Parallel Hash
-               ->  Redistribute Motion 9:9  (slice3; segments: 9)
-                     Hash Key: t1.b
+               ->  Redistribute Motion 6:9  (slice3; segments: 6)
+                     Hash Key: t2.a
                      Hash Module: 3
-                     ->  Parallel Seq Scan on t1
+                     ->  Parallel Seq Scan on t2
  Optimizer: Postgres query optimizer
 (13 rows)
 
@@ -1690,34 +1690,34 @@ analyze t2;
 set local enable_parallel = on;
 -- parallel hash join with shared table, SinglQE as outer partial path.
 explain(locus, costs off) select * from (select count(*) as a from t2) t2 left join t1 on t1.a = t2.a;
-                            QUERY PLAN                            
-------------------------------------------------------------------
+                               QUERY PLAN                               
+------------------------------------------------------------------------
  Gather Motion 6:1  (slice1; segments: 6)
    Locus: Entry
-   ->  Parallel Hash Left Join
-         Locus: Hashed
+   ->  Parallel Hash Right Join
+         Locus: HashedWorkers
          Parallel Workers: 2
-         Hash Cond: ((count(*)) = t1.a)
-         ->  Redistribute Motion 1:6  (slice2; segments: 1)
-               Locus: Hashed
+         Hash Cond: (t1.a = (count(*)))
+         ->  Parallel Seq Scan on t1
+               Locus: HashedWorkers
                Parallel Workers: 2
-               Hash Key: (count(*))
-               Hash Module: 3
-               ->  Finalize Aggregate
-                     Locus: SingleQE
-                     ->  Gather Motion 6:1  (slice3; segments: 6)
-                           Locus: SingleQE
-                           ->  Partial Aggregate
-                                 Locus: HashedWorkers
-                                 Parallel Workers: 2
-                                 ->  Parallel Seq Scan on t2
-                                       Locus: HashedWorkers
-                                       Parallel Workers: 2
          ->  Parallel Hash
                Locus: Hashed
-               ->  Parallel Seq Scan on t1
-                     Locus: HashedWorkers
+               ->  Redistribute Motion 1:6  (slice2; segments: 1)
+                     Locus: Hashed
                      Parallel Workers: 2
+                     Hash Key: (count(*))
+                     Hash Module: 3
+                     ->  Finalize Aggregate
+                           Locus: SingleQE
+                           ->  Gather Motion 6:1  (slice3; segments: 6)
+                                 Locus: SingleQE
+                                 ->  Partial Aggregate
+                                       Locus: HashedWorkers
+                                       Parallel Workers: 2
+                                       ->  Parallel Seq Scan on t2
+                                             Locus: HashedWorkers
+                                             Parallel Workers: 2
  Optimizer: Postgres query optimizer
 (27 rows)
 
@@ -1975,7 +1975,7 @@ explain (locus, costs off) select * from rt1 union all select * from t1;
          ->  Result
                Locus: Strewn
                Parallel Workers: 3
-               One-Time Filter: (gp_execution_segment() = 0)
+               One-Time Filter: (gp_execution_segment() = 1)
                ->  Parallel Seq Scan on rt1
                      Locus: SegmentGeneralWorkers
                      Parallel Workers: 3
@@ -1999,7 +1999,7 @@ explain (locus, costs off) select * from rt1 union all select * from t2;
          ->  Result
                Locus: Strewn
                Parallel Workers: 3
-               One-Time Filter: (gp_execution_segment() = 0)
+               One-Time Filter: (gp_execution_segment() = 1)
                ->  Parallel Seq Scan on rt1
                      Locus: SegmentGeneralWorkers
                      Parallel Workers: 3
@@ -2296,8 +2296,8 @@ analyze t1;
 analyze t2;
 analyze t3_null;
 explain(costs off) select sum(t1.c1) from t1 where c1 not in (select c2 from t2);
-                                     QUERY PLAN                                     
-------------------------------------------------------------------------------------
+                                    QUERY PLAN                                     
+-----------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 6:1  (slice1; segments: 6)
          ->  Partial Aggregate
@@ -2317,8 +2317,8 @@ select sum(t1.c1) from t1 where c1 not in (select c2 from t2);
 (1 row)
 
 explain(costs off) select * from t1 where c1 not in (select c2 from t3_null);
-                               QUERY PLAN                               
-------------------------------------------------------------------------
+                              QUERY PLAN                               
+-----------------------------------------------------------------------
  Gather Motion 6:1  (slice1; segments: 6)
    ->  Parallel Hash Left Anti Semi (Not-In) Join
          Hash Cond: (t1.c1 = t3_null.c2)
@@ -2457,8 +2457,11 @@ abort;
 begin;
 create table pagg_tab (a int, b int, c text, d int) partition by list(c);
 create table pagg_tab_p1 partition of pagg_tab for values in ('0000', '0001', '0002', '0003', '0004');
+NOTICE:  table has parent, setting distribution columns to match parent table
 create table pagg_tab_p2 partition of pagg_tab for values in ('0005', '0006', '0007', '0008');
+NOTICE:  table has parent, setting distribution columns to match parent table
 create table pagg_tab_p3 partition of pagg_tab for values in ('0009', '0010', '0011');
+NOTICE:  table has parent, setting distribution columns to match parent table
 insert into pagg_tab select i % 20, i % 30, to_char(i % 12, 'FM0000'), i % 30 from generate_series(0, 2999) i;
 analyze pagg_tab;
 set local enable_parallel to off;
@@ -2972,7 +2975,7 @@ create table t2_anti(a int, b int) with(parallel_workers=2) distributed by (b);
 insert into t2_anti values(generate_series(5, 10));
 explain(costs off, verbose)
 select t1_anti.a, t1_anti.b from t1_anti left join t2_anti on t1_anti.a = t2_anti.a where t2_anti.a is null;
-                            QUERY PLAN                            
+                            QUERY PLAN
 ------------------------------------------------------------------
  Gather Motion 3:1  (slice1; segments: 3)
    Output: t1_anti.a, t1_anti.b
@@ -3068,8 +3071,8 @@ select t1_anti.a, t1_anti.b from t1_anti left join t2_anti on t1_anti.a = t2_ant
 ---+---
  3 |  
  4 |  
- 1 |  
  2 |  
+ 1 |  
 (4 rows)
 
 abort;
@@ -3098,7 +3101,7 @@ insert into t_distinct_0 select * from t_distinct_0;
 analyze t_distinct_0;
 explain(costs off)
 select distinct a from t_distinct_0;
-                         QUERY PLAN                         
+                         QUERY PLAN
 ------------------------------------------------------------
  Gather Motion 3:1  (slice1; segments: 3)
    ->  HashAggregate
@@ -3232,8 +3235,6 @@ select distinct a, b from t_distinct_0;
 drop table if exists t_distinct_1;
 NOTICE:  table "t_distinct_1" does not exist, skipping
 create table t_distinct_1(a int, b int) using ao_column;
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
-HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into t_distinct_1 select * from t_distinct_0;
 analyze t_distinct_1;
 set enable_parallel = off;
@@ -3520,10 +3521,7 @@ WHERE e.salary > (
 -- Test https://github.com/apache/cloudberry/issues/1376
 --
 create table t1(a int, b int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
-HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table t2 (like t1);
-NOTICE:  table doesn't have 'DISTRIBUTED BY' clause, defaulting to distribution columns from LIKE table
 set gp_cte_sharing = on;
 explain(locus, costs off) with x as
   (select a, count(*) as b from t1 group by a union all
@@ -3571,8 +3569,184 @@ explain(locus, costs off) with x as
 reset gp_cte_sharing;
 reset enable_parallel;
 reset min_parallel_table_scan_size;
+--
+-- Parallel Hash Full/Right Join
+--
+begin;
+create table pj_t1(id int, v int) with(parallel_workers=2) distributed by (id);
+create table pj_t2(id int, v int) with(parallel_workers=2) distributed by (id);
+create table pj_t3(id int, v int) with(parallel_workers=0) distributed by (id);
+-- pj_t1 is 3x larger than pj_t2 so the planner hashes the smaller pj_t2
+-- and probes with pj_t1, producing a genuine Parallel Hash Right Join plan.
+insert into pj_t1 select i, i from generate_series(1,30000)i;
+insert into pj_t2 select i, i from generate_series(25001,35000)i;
+insert into pj_t3 select i, i from generate_series(1,10000)i;
+analyze pj_t1;
+analyze pj_t2;
+analyze pj_t3;
+set local enable_parallel = on;
+set local min_parallel_table_scan_size = 0;
+-- 12_P_12_10: Parallel Hash Full Join: HashedWorkers FULL JOIN HashedWorkers -> HashedOJ(parallel)
+explain(costs off, locus)
+select count(*) from pj_t1 full join pj_t2 using (id);
+                        QUERY PLAN                        
+----------------------------------------------------------
+ Finalize Aggregate
+   Locus: Entry
+   ->  Gather Motion 6:1  (slice1; segments: 6)
+         Locus: Entry
+         ->  Partial Aggregate
+               Locus: HashedOJ
+               Parallel Workers: 2
+               ->  Parallel Hash Full Join
+                     Locus: HashedOJ
+                     Parallel Workers: 2
+                     Hash Cond: (pj_t1.id = pj_t2.id)
+                     ->  Parallel Seq Scan on pj_t1
+                           Locus: HashedWorkers
+                           Parallel Workers: 2
+                     ->  Parallel Hash
+                           Locus: Hashed
+                           ->  Parallel Seq Scan on pj_t2
+                                 Locus: HashedWorkers
+                                 Parallel Workers: 2
+ Optimizer: Postgres query optimizer
+(20 rows)
+
+-- correctness: parallel result matches non-parallel
+set local enable_parallel = off;
+select count(*) from pj_t1 full join pj_t2 using (id);
+ count 
+-------
+ 35000
+(1 row)
+
+set local enable_parallel = on;
+select count(*) from pj_t1 full join pj_t2 using (id);
+ count 
+-------
+ 35000
+(1 row)
+
+-- Parallel Hash Right Join: pj_t1 (30K) is larger, so the planner hashes the smaller pj_t2
+-- (10K) as the build side and probes with pj_t1; result locus HashedWorkers(parallel)
+explain(costs off, locus)
+select count(*) from pj_t1 right join pj_t2 using (id);
+                        QUERY PLAN                        
+----------------------------------------------------------
+ Finalize Aggregate
+   Locus: Entry
+   ->  Gather Motion 6:1  (slice1; segments: 6)
+         Locus: Entry
+         ->  Partial Aggregate
+               Locus: HashedWorkers
+               Parallel Workers: 2
+               ->  Parallel Hash Right Join
+                     Locus: HashedWorkers
+                     Parallel Workers: 2
+                     Hash Cond: (pj_t1.id = pj_t2.id)
+                     ->  Parallel Seq Scan on pj_t1
+                           Locus: HashedWorkers
+                           Parallel Workers: 2
+                     ->  Parallel Hash
+                           Locus: Hashed
+                           ->  Parallel Seq Scan on pj_t2
+                                 Locus: HashedWorkers
+                                 Parallel Workers: 2
+ Optimizer: Postgres query optimizer
+(20 rows)
+
+-- correctness: parallel result matches non-parallel
+set local enable_parallel = off;
+select count(*) from pj_t1 right join pj_t2 using (id);
+ count 
+-------
+ 10000
+(1 row)
+
+set local enable_parallel = on;
+select count(*) from pj_t1 right join pj_t2 using (id);
+ count 
+-------
+ 10000
+(1 row)
+
+-- Locus propagation: HashedOJ(parallel) followed by INNER JOIN with Hashed(serial)
+-- The full join result (HashedOJ,parallel=2) is joined with pj_t3 (Hashed,serial)
+explain(costs off, locus)
+select count(*) from (pj_t1 full join pj_t2 using (id)) fj inner join pj_t3 using (id);
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
+ Finalize Aggregate
+   Locus: Entry
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Locus: Entry
+         ->  Partial Aggregate
+               Locus: HashedOJ
+               ->  Hash Join
+                     Locus: HashedOJ
+                     Hash Cond: (COALESCE(pj_t1.id, pj_t2.id) = pj_t3.id)
+                     ->  Hash Full Join
+                           Locus: HashedOJ
+                           Hash Cond: (pj_t1.id = pj_t2.id)
+                           ->  Seq Scan on pj_t1
+                                 Locus: Hashed
+                           ->  Hash
+                                 Locus: Hashed
+                                 ->  Seq Scan on pj_t2
+                                       Locus: Hashed
+                     ->  Hash
+                           Locus: Replicated
+                           ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                                 Locus: Replicated
+                                 ->  Seq Scan on pj_t3
+                                       Locus: Hashed
+ Optimizer: Postgres query optimizer
+(25 rows)
+
+-- Locus propagation: HashedOJ(parallel) followed by FULL JOIN with Hashed(serial)
+explain(costs off, locus)
+select count(*) from (pj_t1 full join pj_t2 using (id)) fj full join pj_t3 using (id);
+                                QUERY PLAN                                
+--------------------------------------------------------------------------
+ Finalize Aggregate
+   Locus: Entry
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Locus: Entry
+         ->  Partial Aggregate
+               Locus: HashedOJ
+               ->  Hash Full Join
+                     Locus: HashedOJ
+                     Hash Cond: (COALESCE(pj_t1.id, pj_t2.id) = pj_t3.id)
+                     ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                           Locus: Hashed
+                           Hash Key: COALESCE(pj_t1.id, pj_t2.id)
+                           ->  Hash Full Join
+                                 Locus: HashedOJ
+                                 Hash Cond: (pj_t1.id = pj_t2.id)
+                                 ->  Seq Scan on pj_t1
+                                       Locus: Hashed
+                                 ->  Hash
+                                       Locus: Hashed
+                                       ->  Seq Scan on pj_t2
+                                             Locus: Hashed
+                     ->  Hash
+                           Locus: Hashed
+                           ->  Seq Scan on pj_t3
+                                 Locus: Hashed
+ Optimizer: Postgres query optimizer
+(26 rows)
+
+abort;
 -- start_ignore
 drop schema test_parallel cascade;
+NOTICE:  drop cascades to 6 other objects
+DETAIL:  drop cascades to table t_distinct_0
+drop cascades to table t_distinct_1
+drop cascades to table departments
+drop cascades to table employees
+drop cascades to table t1
+drop cascades to table t2
 -- end_ignore
 reset gp_appendonly_insert_files;
 reset force_parallel_mode;
diff --git a/src/test/regress/expected/create_index.out b/src/test/regress/expected/create_index.out
index 0bc2aaa9f6e..f71a81ef9cf 100644
--- a/src/test/regress/expected/create_index.out
+++ b/src/test/regress/expected/create_index.out
@@ -1705,7 +1705,7 @@ DROP TABLE syscol_table;
 --
 -- Tests for IS NULL/IS NOT NULL with b-tree indexes
 --
-CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek;
+CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek DISTRIBUTED BY (unique1);
 INSERT INTO onek_with_null (unique1,unique2) VALUES (NULL, -1), (NULL, NULL);
 CREATE UNIQUE INDEX onek_nulltest ON onek_with_null (unique2,unique1);
 SET enable_seqscan = OFF;
diff --git a/src/test/regress/expected/create_index_optimizer.out b/src/test/regress/expected/create_index_optimizer.out
index 65f5f92b8bd..c133678d152 100644
--- a/src/test/regress/expected/create_index_optimizer.out
+++ b/src/test/regress/expected/create_index_optimizer.out
@@ -652,18 +652,16 @@ SELECT * FROM point_tblv WHERE f1 IS NOT NULL ORDER BY f1 <-> '0,1';
 --SELECT * FROM point_tbl WHERE f1 IS NOT NULL ORDER BY f1 <-> '0,1';
 EXPLAIN (COSTS OFF)
 SELECT * FROM point_tblv WHERE f1 <@ '(-10,-10),(10,10)':: box ORDER BY f1 <-> '0,1';
-                                                                                QUERY PLAN                                                                                
---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
- Result
-   ->  Sort
-         Sort Key: ((f1 <-> '(0,1)'::point))
-         ->  Result
-               ->  Gather Motion 3:1  (slice1; segments: 3)
-                     ->  Index Scan using gpointind on point_tbl
-                           Index Cond: (f1 <@ '(10,10),(-10,-10)'::box)
-                           Filter: ((f1 <> '(1e-300,-1e-300)'::point) AND ((f1 <-> '(0,0)'::point) <> 'Infinity'::double precision) AND (f1 <@ '(10,10),(-10,-10)'::box))
- Optimizer: Pivotal Optimizer (GPORCA)
-(9 rows)
+                                                    QUERY PLAN                                                     
+-------------------------------------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Merge Key: ((point_tbl.f1 <-> '(0,1)'::point))
+   ->  Index Only Scan using gpointind on point_tbl
+         Index Cond: (f1 <@ '(10,10),(-10,-10)'::box)
+         Order By: (f1 <-> '(0,1)'::point)
+         Filter: ((f1 <> '(1e-300,-1e-300)'::point) AND ((f1 <-> '(0,0)'::point) <> 'Infinity'::double precision))
+ Optimizer: Postgres query optimizer
+(7 rows)
 
 SELECT * FROM point_tblv WHERE f1 <@ '(-10,-10),(10,10)':: box ORDER BY f1 <-> '0,1';
    f1    
@@ -767,18 +765,19 @@ SET enable_indexscan = OFF;
 SET enable_bitmapscan = ON;
 EXPLAIN (COSTS OFF)
 SELECT * FROM point_tblv WHERE f1 <@ '(-10,-10),(10,10)':: box ORDER BY f1 <-> '0,1';
-                                                                                QUERY PLAN                                                                                
---------------------------------------------------------------------------------------------------------------------------------------------------------------------------
- Result
+                                                       QUERY PLAN                                                        
+-------------------------------------------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Merge Key: ((point_tbl.f1 <-> '(0,1)'::point))
    ->  Sort
-         Sort Key: ((f1 <-> '(0,1)'::point))
-         ->  Result
-               ->  Gather Motion 3:1  (slice1; segments: 3)
-                     ->  Index Scan using gpointind on point_tbl
-                           Index Cond: (f1 <@ '(10,10),(-10,-10)'::box)
-                           Filter: ((f1 <> '(1e-300,-1e-300)'::point) AND ((f1 <-> '(0,0)'::point) <> 'Infinity'::double precision) AND (f1 <@ '(10,10),(-10,-10)'::box))
- Optimizer: Pivotal Optimizer (GPORCA)
-(9 rows)
+         Sort Key: ((point_tbl.f1 <-> '(0,1)'::point))
+         ->  Bitmap Heap Scan on point_tbl
+               Recheck Cond: (f1 <@ '(10,10),(-10,-10)'::box)
+               Filter: ((f1 <> '(1e-300,-1e-300)'::point) AND ((f1 <-> '(0,0)'::point) <> 'Infinity'::double precision))
+               ->  Bitmap Index Scan on gpointind
+                     Index Cond: (f1 <@ '(10,10),(-10,-10)'::box)
+ Optimizer: Postgres query optimizer
+(10 rows)
 
 SELECT * FROM point_tblv WHERE f1 <@ '(-10,-10),(10,10)':: box ORDER BY f1 <-> '0,1';
    f1    
@@ -1734,7 +1733,7 @@ DROP TABLE syscol_table;
 --
 -- Tests for IS NULL/IS NOT NULL with b-tree indexes
 --
-CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek;
+CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek DISTRIBUTED BY (unique1);
 INSERT INTO onek_with_null (unique1,unique2) VALUES (NULL, -1), (NULL, NULL);
 CREATE UNIQUE INDEX onek_nulltest ON onek_with_null (unique2,unique1);
 SET enable_seqscan = OFF;
diff --git a/src/test/regress/expected/create_view.out b/src/test/regress/expected/create_view.out
index ac88c92f398..2a1fdca3562 100644
--- a/src/test/regress/expected/create_view.out
+++ b/src/test/regress/expected/create_view.out
@@ -1999,6 +1999,44 @@ select pg_get_viewdef('tt26v', true);
     FROM ( VALUES (1,2,3)) v(x, y, z);
 (1 row)
 
+-- Test that changing the relkind of a relcache entry doesn't cause
+-- trouble. Prior instances of where it did:
+-- CALDaNm2yXz+zOtv7y5zBd5WKT8O0Ld3YxikuU3dcyCvxF7gypA@mail.gmail.com
+-- CALDaNm3oZA-8Wbps2Jd1g5_Gjrr-x3YWrJPek-mF5Asrrvz2Dg@mail.gmail.com
+CREATE TABLE tt26(c int);
+BEGIN;
+CREATE TABLE tt27(c int);
+SAVEPOINT q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+SELECT * FROM tt27;
+ c 
+---
+(0 rows)
+
+ROLLBACK TO q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+ROLLBACK;
+BEGIN;
+CREATE TABLE tt28(c int);
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+ERROR:  "tt28" is already a view
+ROLLBACK;
+-- test restriction on non-system view expansion.
+create table tt27v_tbl (a int);
+create view tt27v as select a from tt27v_tbl;
+set restrict_nonsystem_relation_kind to 'view';
+select a from tt27v where a > 0; -- Error
+ERROR:  access to non-system view "tt27v" is restricted
+insert into tt27v values (1); -- Error
+ERROR:  access to non-system view "tt27v" is restricted
+select viewname from pg_views where viewname = 'tt27v'; -- Ok to access a system view.
+ viewname 
+----------
+ tt27v
+(1 row)
+
+reset restrict_nonsystem_relation_kind;
 -- test display negative operator of const-folder expression
 create table tdis(a int, b int, c int);
 NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Greenplum Database data distribution key for this table.
@@ -2046,7 +2084,7 @@ drop cascades to view aliased_view_2
 drop cascades to view aliased_view_3
 drop cascades to view aliased_view_4
 DROP SCHEMA testviewschm2 CASCADE;
-NOTICE:  drop cascades to 76 other objects
+NOTICE:  drop cascades to 79 other objects
 DETAIL:  drop cascades to table t1
 drop cascades to view temporal1
 drop cascades to view temporal2
@@ -2121,5 +2159,8 @@ drop cascades to view tt23v
 drop cascades to view tt24v
 drop cascades to view tt25v
 drop cascades to view tt26v
+drop cascades to table tt26
+drop cascades to table tt27v_tbl
+drop cascades to view tt27v
 drop cascades to table tdis
 drop cascades to view tdis_v1
diff --git a/src/test/regress/expected/create_view_optimizer.out b/src/test/regress/expected/create_view_optimizer.out
index ece2034d92d..c17ae313cac 100755
--- a/src/test/regress/expected/create_view_optimizer.out
+++ b/src/test/regress/expected/create_view_optimizer.out
@@ -1997,6 +1997,44 @@ select pg_get_viewdef('tt26v', true);
     FROM ( VALUES (1,2,3)) v(x, y, z);
 (1 row)
 
+-- Test that changing the relkind of a relcache entry doesn't cause
+-- trouble. Prior instances of where it did:
+-- CALDaNm2yXz+zOtv7y5zBd5WKT8O0Ld3YxikuU3dcyCvxF7gypA@mail.gmail.com
+-- CALDaNm3oZA-8Wbps2Jd1g5_Gjrr-x3YWrJPek-mF5Asrrvz2Dg@mail.gmail.com
+CREATE TABLE tt26(c int);
+BEGIN;
+CREATE TABLE tt27(c int);
+SAVEPOINT q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+SELECT * FROM tt27;
+ c 
+---
+(0 rows)
+
+ROLLBACK TO q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+ROLLBACK;
+BEGIN;
+CREATE TABLE tt28(c int);
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+ERROR:  "tt28" is already a view
+ROLLBACK;
+-- test restriction on non-system view expansion.
+create table tt27v_tbl (a int);
+create view tt27v as select a from tt27v_tbl;
+set restrict_nonsystem_relation_kind to 'view';
+select a from tt27v where a > 0; -- Error
+ERROR:  access to non-system view "tt27v" is restricted
+insert into tt27v values (1); -- Error
+ERROR:  access to non-system view "tt27v" is restricted
+select viewname from pg_views where viewname = 'tt27v'; -- Ok to access a system view.
+ viewname 
+----------
+ tt27v
+(1 row)
+
+reset restrict_nonsystem_relation_kind;
 -- test display negative operator of const-folder expression
 create table tdis(a int, b int, c int);
 NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
@@ -2044,7 +2082,7 @@ drop cascades to view aliased_view_2
 drop cascades to view aliased_view_3
 drop cascades to view aliased_view_4
 DROP SCHEMA testviewschm2 CASCADE;
-NOTICE:  drop cascades to 76 other objects
+NOTICE:  drop cascades to 79 other objects
 DETAIL:  drop cascades to table t1
 drop cascades to view temporal1
 drop cascades to view temporal2
@@ -2119,5 +2157,8 @@ drop cascades to view tt23v
 drop cascades to view tt24v
 drop cascades to view tt25v
 drop cascades to view tt26v
+drop cascades to table tt26
+drop cascades to table tt27v_tbl
+drop cascades to view tt27v
 drop cascades to table tdis
 drop cascades to view tdis_v1
diff --git a/src/test/regress/expected/gist_optimizer.out b/src/test/regress/expected/gist_optimizer.out
index e9020c5db70..abb8b5524cf 100644
--- a/src/test/regress/expected/gist_optimizer.out
+++ b/src/test/regress/expected/gist_optimizer.out
@@ -98,18 +98,15 @@ select p from gist_tbl where p <@ box(point(0,0), point(0.5, 0.5));
 explain (costs off)
 select p from gist_tbl where p <@ box(point(0,0), point(0.5, 0.5))
 order by p <-> point(0.201, 0.201);
-                             QUERY PLAN                              
----------------------------------------------------------------------
- Result
-   ->  Gather Motion 3:1  (slice1; segments: 3)
-         Merge Key: ((p <-> '(0.201,0.201)'::point))
-         ->  Sort
-               Sort Key: ((p <-> '(0.201,0.201)'::point))
-               ->  Index Scan using gist_tbl_point_index on gist_tbl
-                     Index Cond: (p <@ '(0.5,0.5),(0,0)'::box)
-                     Filter: (p <@ '(0.5,0.5),(0,0)'::box)
- Optimizer: Pivotal Optimizer (GPORCA) version 3.83.0
-(9 rows)
+                          QUERY PLAN                          
+--------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Merge Key: ((p <-> '(0.201,0.201)'::point))
+   ->  Index Only Scan using gist_tbl_point_index on gist_tbl
+         Index Cond: (p <@ '(0.5,0.5),(0,0)'::box)
+         Order By: (p <-> '(0.201,0.201)'::point)
+ Optimizer: Postgres query optimizer
+(6 rows)
 
 select p from gist_tbl where p <@ box(point(0,0), point(0.5, 0.5))
 order by p <-> point(0.201, 0.201);
@@ -132,18 +129,15 @@ order by p <-> point(0.201, 0.201);
 explain (costs off)
 select p from gist_tbl where p <@ box(point(0,0), point(0.5, 0.5))
 order by point(0.101, 0.101) <-> p;
-                             QUERY PLAN                              
----------------------------------------------------------------------
- Result
-   ->  Gather Motion 3:1  (slice1; segments: 3)
-         Merge Key: (('(0.101,0.101)'::point <-> p))
-         ->  Sort
-               Sort Key: (('(0.101,0.101)'::point <-> p))
-               ->  Index Scan using gist_tbl_point_index on gist_tbl
-                     Index Cond: (p <@ '(0.5,0.5),(0,0)'::box)
-                     Filter: (p <@ '(0.5,0.5),(0,0)'::box)
- Optimizer: Pivotal Optimizer (GPORCA) version 3.83.0
-(9 rows)
+                          QUERY PLAN                          
+--------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Merge Key: (('(0.101,0.101)'::point <-> p))
+   ->  Index Only Scan using gist_tbl_point_index on gist_tbl
+         Index Cond: (p <@ '(0.5,0.5),(0,0)'::box)
+         Order By: (p <-> '(0.101,0.101)'::point)
+ Optimizer: Postgres query optimizer
+(6 rows)
 
 select p from gist_tbl where p <@ box(point(0,0), point(0.5, 0.5))
 order by point(0.101, 0.101) <-> p;
@@ -248,18 +242,15 @@ select b from gist_tbl where b <@ box(point(5,5), point(6,6));
 explain (costs off)
 select b from gist_tbl where b <@ box(point(5,5), point(6,6))
 order by b <-> point(5.2, 5.91);
-                            QUERY PLAN                             
--------------------------------------------------------------------
- Result
-   ->  Gather Motion 3:1  (slice1; segments: 3)
-         Merge Key: ((b <-> '(5.2,5.91)'::point))
-         ->  Sort
-               Sort Key: ((b <-> '(5.2,5.91)'::point))
-               ->  Index Scan using gist_tbl_box_index on gist_tbl
-                     Index Cond: (b <@ '(6,6),(5,5)'::box)
-                     Filter: (b <@ '(6,6),(5,5)'::box)
- Optimizer: Pivotal Optimizer (GPORCA)
-(9 rows)
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Merge Key: ((b <-> '(5.2,5.91)'::point))
+   ->  Index Only Scan using gist_tbl_box_index on gist_tbl
+         Index Cond: (b <@ '(6,6),(5,5)'::box)
+         Order By: (b <-> '(5.2,5.91)'::point)
+ Optimizer: Postgres query optimizer
+(6 rows)
 
 select b from gist_tbl where b <@ box(point(5,5), point(6,6))
 order by b <-> point(5.2, 5.91);
diff --git a/src/test/regress/expected/groupingsets.out b/src/test/regress/expected/groupingsets.out
index f7eefa2c8eb..5222cc22b70 100644
--- a/src/test/regress/expected/groupingsets.out
+++ b/src/test/regress/expected/groupingsets.out
@@ -958,6 +958,25 @@ explain (costs off)
  Optimizer: Postgres query optimizer
 (13 rows)
 
+-- HAVING with constant-false predicate on an empty grouping set must emit
+-- zero rows, not the default scalar-aggregate row.
+select count(*) from gstest2 group by grouping sets (()) having false;
+ count 
+-------
+(0 rows)
+
+explain (costs off)
+  select count(*) from gstest2 group by grouping sets (()) having false;
+             QUERY PLAN
+-------------------------------------
+ Aggregate
+   Group Key: ()
+   Filter: false
+   ->  Result
+         One-Time Filter: false
+ Optimizer: Postgres query optimizer
+(6 rows)
+
 -- HAVING with GROUPING queries
 select ten, grouping(ten) from onek
 group by grouping sets(ten) having grouping(ten) >= 0
diff --git a/src/test/regress/expected/groupingsets_optimizer.out b/src/test/regress/expected/groupingsets_optimizer.out
index 08ef4c1a68c..a07017eca32 100644
--- a/src/test/regress/expected/groupingsets_optimizer.out
+++ b/src/test/regress/expected/groupingsets_optimizer.out
@@ -958,23 +958,39 @@ select v.c, (select count(*) from gstest2 group by () having v.c)
 explain (costs off)
   select v.c, (select count(*) from gstest2 group by () having v.c)
     from (values (false),(true)) v(c) order by v.c;
-                                QUERY PLAN                                
---------------------------------------------------------------------------
- Sort
-   Sort Key: "*VALUES*".column1
-   ->  Values Scan on "*VALUES*"
-         SubPlan 1
-           ->  Aggregate
-                 Group Key: ()
-                 Filter: "*VALUES*".column1
-                 ->  Result
-                       One-Time Filter: "*VALUES*".column1
-                       ->  Materialize
-                             ->  Gather Motion 3:1  (slice1; segments: 3)
+                             QUERY PLAN
+--------------------------------------------------------------------
+ Result
+   ->  Sort
+         Sort Key: "Values".column1
+         ->  Values Scan on "Values"
+   SubPlan 1
+     ->  Result
+           One-Time Filter: "Values".column1
+           ->  Finalize Aggregate
+                 ->  Materialize
+                       ->  Gather Motion 3:1  (slice1; segments: 3)
+                             ->  Partial Aggregate
                                    ->  Seq Scan on gstest2
- Optimizer: Postgres query optimizer
+ Optimizer: GPORCA
 (13 rows)
 
+-- HAVING with constant-false predicate on an empty grouping set must emit
+-- zero rows, not the default scalar-aggregate row.
+select count(*) from gstest2 group by grouping sets (()) having false;
+ count 
+-------
+(0 rows)
+
+explain (costs off)
+  select count(*) from gstest2 group by grouping sets (()) having false;
+        QUERY PLAN
+--------------------------
+ Result
+   One-Time Filter: false
+ Optimizer: GPORCA
+(3 rows)
+
 -- HAVING with GROUPING queries
 select ten, grouping(ten) from onek
 group by grouping sets(ten) having grouping(ten) >= 0
diff --git a/src/test/regress/expected/join_hash.out b/src/test/regress/expected/join_hash.out
index 5171a7d9cf3..e5f74c18d28 100644
--- a/src/test/regress/expected/join_hash.out
+++ b/src/test/regress/expected/join_hash.out
@@ -10,6 +10,9 @@ set allow_system_table_mods=on;
 set local min_parallel_table_scan_size = 0;
 set local parallel_setup_cost = 0;
 set local enable_hashjoin = on;
+-- CBDB: disable CBDB parallel for these PG-originated tests; parallel full join
+-- is tested separately in cbdb_parallel.sql.
+set local enable_parallel = off;
 -- Extract bucket and batch counts from an explain analyze plan.  In
 -- general we can't make assertions about how many batches (or
 -- buckets) will be required because it can vary, but we can in some
@@ -58,12 +61,16 @@ $$;
 -- estimated size.
 create table simple as
   select generate_series(1, 60000) AS id, 'aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa';
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 alter table simple set (parallel_workers = 2);
 analyze simple;
 -- Make a relation whose size we will under-estimate.  We want stats
 -- to say 1000 rows, but actually there are 20,000 rows.
 create table bigger_than_it_looks as
   select generate_series(1, 60000) as id, 'aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa';
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 alter table bigger_than_it_looks set (autovacuum_enabled = 'false');
 WARNING:  autovacuum is not supported in Cloudberry
 alter table bigger_than_it_looks set (parallel_workers = 2);
@@ -73,6 +80,8 @@ update pg_class set reltuples = 1000 where relname = 'bigger_than_it_looks';
 -- kind of skew that breaks our batching scheme.  We want stats to say
 -- 2 rows, but actually there are 20,000 rows with the same key.
 create table extremely_skewed (id int, t text);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 alter table extremely_skewed set (autovacuum_enabled = 'false');
 WARNING:  autovacuum is not supported in Cloudberry
 alter table extremely_skewed set (parallel_workers = 2);
@@ -85,6 +94,8 @@ update pg_class
   where relname = 'extremely_skewed';
 -- Make a relation with a couple of enormous tuples.
 create table wide as select generate_series(1, 2) as id, rpad('', 320000, 'x') as t;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 alter table wide set (parallel_workers = 2);
 ANALYZE wide;
 -- The "optimal" case: the hash table fits in memory; we plan for 1
@@ -315,6 +326,13 @@ $$);
  t                    | f
 (1 row)
 
+-- parallel full multi-batch hash join
+select count(*) from simple r full outer join simple s using (id);
+ count 
+-------
+ 60000
+(1 row)
+
 rollback to settings;
 -- The "bad" case: during execution we need to increase number of
 -- batches; in this case we plan for 1 batch, and increase at least a
@@ -567,9 +585,13 @@ rollback to settings;
 -- Exercise rescans.  We'll turn off parallel_leader_participation so
 -- that we can check that instrumentation comes back correctly.
 create table join_foo as select generate_series(1, 3) as id, 'xxxxx'::text as t;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 analyze join_foo;
 alter table join_foo set (parallel_workers = 0);
 create table join_bar as select generate_series(1, 20000) as id, 'xxxxx'::text as t;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 analyze join_bar;
 alter table join_bar set (parallel_workers = 2);
 -- multi-batch with rescan, parallel-oblivious
@@ -816,7 +838,33 @@ select  count(*) from simple r full outer join simple s using (id);
 (1 row)
 
 rollback to settings;
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
+savepoint settings;
+set enable_parallel_hash = off;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s using (id);
+                     QUERY PLAN                     
+----------------------------------------------------
+ Finalize Aggregate
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         ->  Partial Aggregate
+               ->  Hash Full Join
+                     Hash Cond: (r.id = s.id)
+                     ->  Seq Scan on simple r
+                     ->  Hash
+                           ->  Seq Scan on simple s
+ Optimizer: Postgres query optimizer
+(9 rows)
+
+select  count(*) from simple r full outer join simple s using (id);
+ count 
+-------
+ 60000
+(1 row)
+
+rollback to settings;
+-- parallelism is possible with parallel-aware full hash join
 savepoint settings;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
@@ -841,7 +889,7 @@ select  count(*) from simple r full outer join simple s using (id);
 (1 row)
 
 rollback to settings;
--- An full outer join where every record is not matched.
+-- A full outer join where every record is not matched.
 -- non-parallel
 savepoint settings;
 set local max_parallel_workers_per_gather = 0;
@@ -869,7 +917,35 @@ select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
 (1 row)
 
 rollback to settings;
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
+savepoint settings;
+set enable_parallel_hash = off;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+                               QUERY PLAN                               
+------------------------------------------------------------------------
+ Finalize Aggregate
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         ->  Partial Aggregate
+               ->  Hash Full Join
+                     Hash Cond: ((0 - s.id) = r.id)
+                     ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                           Hash Key: (0 - s.id)
+                           ->  Seq Scan on simple s
+                     ->  Hash
+                           ->  Seq Scan on simple r
+ Optimizer: Postgres query optimizer
+(11 rows)
+
+select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+ count  
+--------
+ 120000
+(1 row)
+
+rollback to settings;
+-- parallelism is possible with parallel-aware full hash join
 savepoint settings;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
@@ -954,7 +1030,11 @@ rollback to settings;
 savepoint settings;
 set max_parallel_workers_per_gather = 0;
 create table join_hash_t_small(a int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table join_hash_t_big(b int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'b' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into join_hash_t_small select i%100 from generate_series(0, 3000)i;
 insert into join_hash_t_big select i%100000 from generate_series(1, 100000)i ;
 analyze join_hash_t_small;
@@ -973,6 +1053,52 @@ explain (costs off) select * from join_hash_t_small, join_hash_t_big where a = b
 
 rollback to settings;
 rollback;
+-- Hash join reuses the HOT status bit to indicate match status. This can only
+-- be guaranteed to produce correct results if all the hash join tuple match
+-- bits are reset before reuse. This is done upon loading them into the
+-- hashtable.
+begin;
+SAVEPOINT settings;
+-- CBDB: disable CBDB parallel; the serial full join match-bit test is what matters here.
+SET enable_parallel = off;
+SET enable_parallel_hash = on;
+SET min_parallel_table_scan_size = 0;
+SET parallel_setup_cost = 0;
+SET parallel_tuple_cost = 0;
+CREATE TABLE hjtest_matchbits_t1(id int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+CREATE TABLE hjtest_matchbits_t2(id int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+INSERT INTO hjtest_matchbits_t1 VALUES (1);
+INSERT INTO hjtest_matchbits_t2 VALUES (2);
+-- Update should create a HOT tuple. If this status bit isn't cleared, we won't
+-- correctly emit the NULL-extended unmatching tuple in full hash join.
+UPDATE hjtest_matchbits_t2 set id = 2;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id
+  ORDER BY t1.id;
+ id | id 
+----+----
+  1 |   
+    |  2
+(2 rows)
+
+-- Test serial full hash join.
+-- Resetting parallel_setup_cost should force a serial plan.
+-- Just to be safe, however, set enable_parallel_hash to off, as parallel full
+-- hash joins are only supported with shared hashtables.
+RESET parallel_setup_cost;
+SET enable_parallel_hash = off;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id;
+ id | id 
+----+----
+    |  2
+  1 |   
+(2 rows)
+
+ROLLBACK TO settings;
+rollback;
 -- Verify that hash key expressions reference the correct
 -- nodes. Hashjoin's hashkeys need to reference its outer plan, Hash's
 -- need to reference Hash's outer plan (which is below HashJoin's
@@ -988,7 +1114,11 @@ BEGIN;
 SET LOCAL enable_sort = OFF; -- avoid mergejoins
 SET LOCAL from_collapse_limit = 1; -- allows easy changing of join order
 CREATE TABLE hjtest_1 (a text, b int, id int, c bool);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 CREATE TABLE hjtest_2 (a bool, id int, b text, c int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 INSERT INTO hjtest_1(a, b, id, c) VALUES ('text', 2, 1, false); -- matches
 INSERT INTO hjtest_1(a, b, id, c) VALUES ('text', 1, 2, false); -- fails id join condition
 INSERT INTO hjtest_1(a, b, id, c) VALUES ('text', 20, 1, false); -- fails < 50
@@ -1045,8 +1175,8 @@ WHERE
          SubPlan 2
            ->  Result
                  Output: (hjtest_1.b * 5)
+ Settings: enable_parallel = 'on', enable_sort = 'off', from_collapse_limit = '1', optimizer = 'off'
  Optimizer: Postgres query optimizer
- Settings: enable_sort=off, from_collapse_limit=1
 (38 rows)
 
 SELECT hjtest_1.a a1, hjtest_2.a a2,hjtest_1.tableoid::regclass t1, hjtest_2.tableoid::regclass t2
@@ -1109,8 +1239,8 @@ WHERE
          SubPlan 3
            ->  Result
                  Output: (hjtest_2.c * 5)
+ Settings: enable_parallel = 'on', enable_sort = 'off', from_collapse_limit = '1', optimizer = 'off'
  Optimizer: Postgres query optimizer
- Settings: enable_sort=off, from_collapse_limit=1
 (38 rows)
 
 SELECT hjtest_1.a a1, hjtest_2.a a2,hjtest_1.tableoid::regclass t1, hjtest_2.tableoid::regclass t2
diff --git a/src/test/regress/expected/join_hash_optimizer.out b/src/test/regress/expected/join_hash_optimizer.out
index 053d0ef4898..1835bfa4f31 100644
--- a/src/test/regress/expected/join_hash_optimizer.out
+++ b/src/test/regress/expected/join_hash_optimizer.out
@@ -10,6 +10,9 @@ set allow_system_table_mods=on;
 set local min_parallel_table_scan_size = 0;
 set local parallel_setup_cost = 0;
 set local enable_hashjoin = on;
+-- CBDB: disable CBDB parallel for these PG-originated tests; parallel full join
+-- is tested separately in cbdb_parallel.sql.
+set local enable_parallel = off;
 -- Extract bucket and batch counts from an explain analyze plan.  In
 -- general we can't make assertions about how many batches (or
 -- buckets) will be required because it can vary, but we can in some
@@ -115,7 +118,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -156,7 +159,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -197,7 +200,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -241,7 +244,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -283,7 +286,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -325,7 +328,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: s.id
                                  ->  Seq Scan on simple s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select count(*) from simple r join simple s using (id);
@@ -344,6 +347,13 @@ $$);
  t                    | f
 (1 row)
 
+-- parallel full multi-batch hash join
+select count(*) from simple r full outer join simple s using (id);
+ count 
+-------
+ 60000
+(1 row)
+
 rollback to settings;
 -- The "bad" case: during execution we need to increase number of
 -- batches; in this case we plan for 1 batch, and increase at least a
@@ -356,8 +366,8 @@ set local work_mem = '128kB';
 set local statement_mem = '1000kB'; -- GPDB uses statement_mem instead of work_mem
 explain (costs off)
   select count(*) FROM simple r JOIN bigger_than_it_looks s USING (id);
-                                  QUERY PLAN                                  
-------------------------------------------------------------------------------
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -367,8 +377,8 @@ explain (costs off)
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on bigger_than_it_looks s
- Optimizer: Pivotal Optimizer (GPORCA)
-(13 rows)
+ Optimizer: GPORCA
+(10 rows)
 
 select count(*) FROM simple r JOIN bigger_than_it_looks s USING (id);
  count 
@@ -395,8 +405,8 @@ set local statement_mem = '1000kB'; -- GPDB uses statement_mem instead of work_m
 set local enable_parallel_hash = off;
 explain (costs off)
   select count(*) from simple r join bigger_than_it_looks s using (id);
-                                  QUERY PLAN                                  
-------------------------------------------------------------------------------
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -406,8 +416,8 @@ explain (costs off)
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on bigger_than_it_looks s
- Optimizer: Pivotal Optimizer (GPORCA)
-(13 rows)
+ Optimizer: GPORCA
+(10 rows)
 
 select count(*) from simple r join bigger_than_it_looks s using (id);
  count 
@@ -434,8 +444,8 @@ set local statement_mem = '1000kB'; -- GPDB uses statement_mem instead of work_m
 set local enable_parallel_hash = on;
 explain (costs off)
   select count(*) from simple r join bigger_than_it_looks s using (id);
-                                  QUERY PLAN                                  
-------------------------------------------------------------------------------
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -445,8 +455,8 @@ explain (costs off)
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on bigger_than_it_looks s
- Optimizer: Pivotal Optimizer (GPORCA)
-(13 rows)
+ Optimizer: GPORCA
+(10 rows)
 
 select count(*) from simple r join bigger_than_it_looks s using (id);
  count 
@@ -490,7 +500,7 @@ HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on extremely_skewed s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (10 rows)
 
 select count(*) from simple r join extremely_skewed s using (id);
@@ -534,7 +544,7 @@ HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on extremely_skewed s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (10 rows)
 
 select count(*) from simple r join extremely_skewed s using (id);
@@ -578,7 +588,7 @@ HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For
                      ->  Hash
                            ->  Broadcast Motion 3:3  (slice2; segments: 3)
                                  ->  Seq Scan on extremely_skewed s
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (10 rows)
 
 select count(*) from simple r join extremely_skewed s using (id);
@@ -643,8 +653,8 @@ explain (costs off)
   select count(*) from join_foo
     left join (select b1.id, b1.t from join_bar b1 join join_bar b2 using (id)) ss
     on join_foo.id < ss.id + 1 and join_foo.id > ss.id - 1;
-                                                 QUERY PLAN                                                 
-------------------------------------------------------------------------------------------------------------
+                                           QUERY PLAN                                           
+------------------------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -662,7 +672,7 @@ explain (costs off)
                                              ->  Redistribute Motion 3:3  (slice4; segments: 3)
                                                    Hash Key: b2.id
                                                    ->  Seq Scan on join_bar b2
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (18 rows)
 
 select count(*) from join_foo
@@ -701,8 +711,8 @@ explain (costs off)
   select count(*) from join_foo
     left join (select b1.id, b1.t from join_bar b1 join join_bar b2 using (id)) ss
     on join_foo.id < ss.id + 1 and join_foo.id > ss.id - 1;
-                                                 QUERY PLAN                                                 
-------------------------------------------------------------------------------------------------------------
+                                           QUERY PLAN                                           
+------------------------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -720,7 +730,7 @@ explain (costs off)
                                              ->  Redistribute Motion 3:3  (slice4; segments: 3)
                                                    Hash Key: b2.id
                                                    ->  Seq Scan on join_bar b2
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (18 rows)
 
 select count(*) from join_foo
@@ -760,8 +770,8 @@ explain (costs off)
   select count(*) from join_foo
     left join (select b1.id, b1.t from join_bar b1 join join_bar b2 using (id)) ss
     on join_foo.id < ss.id + 1 and join_foo.id > ss.id - 1;
-                                                 QUERY PLAN                                                 
-------------------------------------------------------------------------------------------------------------
+                                           QUERY PLAN                                           
+------------------------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -779,7 +789,7 @@ explain (costs off)
                                              ->  Redistribute Motion 3:3  (slice4; segments: 3)
                                                    Hash Key: b2.id
                                                    ->  Seq Scan on join_bar b2
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (18 rows)
 
 select count(*) from join_foo
@@ -818,8 +828,8 @@ explain (costs off)
   select count(*) from join_foo
     left join (select b1.id, b1.t from join_bar b1 join join_bar b2 using (id)) ss
     on join_foo.id < ss.id + 1 and join_foo.id > ss.id - 1;
-                                                 QUERY PLAN                                                 
-------------------------------------------------------------------------------------------------------------
+                                           QUERY PLAN                                           
+------------------------------------------------------------------------------------------------
  Finalize Aggregate
    ->  Gather Motion 3:1  (slice1; segments: 3)
          ->  Partial Aggregate
@@ -837,7 +847,7 @@ explain (costs off)
                                              ->  Redistribute Motion 3:3  (slice4; segments: 3)
                                                    Hash Key: b2.id
                                                    ->  Seq Scan on join_bar b2
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (18 rows)
 
 select count(*) from join_foo
@@ -891,8 +901,9 @@ select  count(*) from simple r full outer join simple s using (id);
 (1 row)
 
 rollback to settings;
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
 savepoint settings;
+set enable_parallel_hash = off;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
      select  count(*) from simple r full outer join simple s using (id);
@@ -920,7 +931,36 @@ select  count(*) from simple r full outer join simple s using (id);
 (1 row)
 
 rollback to settings;
--- An full outer join where every record is not matched.
+-- parallelism is possible with parallel-aware full hash join
+savepoint settings;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s using (id);
+                                  QUERY PLAN                                  
+------------------------------------------------------------------------------
+ Finalize Aggregate
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         ->  Partial Aggregate
+               ->  Hash Full Join
+                     Hash Cond: (r.id = s.id)
+                     ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                           Hash Key: r.id
+                           ->  Seq Scan on simple r
+                     ->  Hash
+                           ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                                 Hash Key: s.id
+                                 ->  Seq Scan on simple s
+ Optimizer: GPORCA
+(13 rows)
+
+select  count(*) from simple r full outer join simple s using (id);
+ count 
+-------
+ 60000
+(1 row)
+
+rollback to settings;
+-- A full outer join where every record is not matched.
 -- non-parallel
 savepoint settings;
 set local max_parallel_workers_per_gather = 0;
@@ -950,7 +990,37 @@ select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
 (1 row)
 
 rollback to settings;
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
+savepoint settings;
+set enable_parallel_hash = off;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+                                  QUERY PLAN                                  
+------------------------------------------------------------------------------
+ Finalize Aggregate
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         ->  Partial Aggregate
+               ->  Hash Full Join
+                     Hash Cond: (r.id = (0 - s.id))
+                     ->  Redistribute Motion 3:3  (slice2; segments: 3)
+                           Hash Key: r.id
+                           ->  Seq Scan on simple r
+                     ->  Hash
+                           ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                                 Hash Key: (0 - s.id)
+                                 ->  Seq Scan on simple s
+ Optimizer: GPORCA
+(13 rows)
+
+select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+ count  
+--------
+ 120000
+(1 row)
+
+rollback to settings;
+-- parallelism is possible with parallel-aware full hash join
 savepoint settings;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
@@ -1012,7 +1082,7 @@ explain (costs off)
                            ->  Redistribute Motion 3:3  (slice3; segments: 3)
                                  Hash Key: wide_1.id
                                  ->  Seq Scan on wide wide_1
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (13 rows)
 
 select length(max(s.t))
@@ -1060,11 +1130,57 @@ explain (costs off) select * from join_hash_t_small, join_hash_t_big where a = b
          ->  Seq Scan on join_hash_t_big
          ->  Hash
                ->  Seq Scan on join_hash_t_small
- Optimizer: Pivotal Optimizer (GPORCA)
+ Optimizer: GPORCA
 (7 rows)
 
 rollback to settings;
 rollback;
+-- Hash join reuses the HOT status bit to indicate match status. This can only
+-- be guaranteed to produce correct results if all the hash join tuple match
+-- bits are reset before reuse. This is done upon loading them into the
+-- hashtable.
+begin;
+SAVEPOINT settings;
+-- CBDB: disable CBDB parallel; the serial full join match-bit test is what matters here.
+SET enable_parallel = off;
+SET enable_parallel_hash = on;
+SET min_parallel_table_scan_size = 0;
+SET parallel_setup_cost = 0;
+SET parallel_tuple_cost = 0;
+CREATE TABLE hjtest_matchbits_t1(id int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+CREATE TABLE hjtest_matchbits_t2(id int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+INSERT INTO hjtest_matchbits_t1 VALUES (1);
+INSERT INTO hjtest_matchbits_t2 VALUES (2);
+-- Update should create a HOT tuple. If this status bit isn't cleared, we won't
+-- correctly emit the NULL-extended unmatching tuple in full hash join.
+UPDATE hjtest_matchbits_t2 set id = 2;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id
+  ORDER BY t1.id;
+ id | id 
+----+----
+  1 |   
+    |  2
+(2 rows)
+
+-- Test serial full hash join.
+-- Resetting parallel_setup_cost should force a serial plan.
+-- Just to be safe, however, set enable_parallel_hash to off, as parallel full
+-- hash joins are only supported with shared hashtables.
+RESET parallel_setup_cost;
+SET enable_parallel_hash = off;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id;
+ id | id 
+----+----
+    |  2
+  1 |   
+(2 rows)
+
+ROLLBACK TO settings;
+rollback;
 -- Verify that hash key expressions reference the correct
 -- nodes. Hashjoin's hashkeys need to reference its outer plan, Hash's
 -- need to reference Hash's outer plan (which is below HashJoin's
@@ -1154,9 +1270,9 @@ WHERE
                                    Filter: (((hjtest_1.b * 5)) < 50)
                                    ->  Result
                                          Output: (hjtest_1.b * 5)
- Settings: enable_sort = 'off', from_collapse_limit = '1'
- Optimizer: Pivotal Optimizer (GPORCA)
-(49 rows)
+ Settings: enable_parallel = 'on', enable_sort = 'off', from_collapse_limit = '1', optimizer = 'on'
+ Optimizer: GPORCA
+(51 rows)
 
 SELECT hjtest_1.a a1, hjtest_2.a a2,hjtest_1.tableoid::regclass t1, hjtest_2.tableoid::regclass t2
 FROM hjtest_1, hjtest_2
@@ -1231,9 +1347,9 @@ WHERE
                                    Filter: (((hjtest_1.b * 5)) < 50)
                                    ->  Result
                                          Output: (hjtest_1.b * 5)
- Settings: enable_sort = 'off', from_collapse_limit = '1'
- Optimizer: Pivotal Optimizer (GPORCA)
-(49 rows)
+ Settings: enable_parallel = 'on', enable_sort = 'off', from_collapse_limit = '1', optimizer = 'on'
+ Optimizer: GPORCA
+(51 rows)
 
 SELECT hjtest_1.a a1, hjtest_2.a a2,hjtest_1.tableoid::regclass t1, hjtest_2.tableoid::regclass t2
 FROM hjtest_2, hjtest_1
diff --git a/src/test/regress/expected/matview_data.out b/src/test/regress/expected/matview_data.out
index 85697e90072..9a9074cd2d5 100644
--- a/src/test/regress/expected/matview_data.out
+++ b/src/test/regress/expected/matview_data.out
@@ -791,6 +791,1431 @@ drop materialized view mv_join2;
 drop table jt3;
 drop table jt2;
 drop table jt1;
+--
+-- Test AQUMV (Answer Query Using Materialized Views) with join queries.
+-- Each matching test shows EXPLAIN + SELECT with GUC off (original plan),
+-- then EXPLAIN + SELECT with GUC on (MV rewrite). Results must match.
+--
+create table aqj_t1(a int, b int) distributed by (a);
+create table aqj_t2(a int, b int) distributed by (a);
+create table aqj_t3(a int, b int) distributed by (a);
+insert into aqj_t1 select i, i*10 from generate_series(1, 100) i;
+insert into aqj_t2 select i, i*100 from generate_series(1, 100) i;
+insert into aqj_t3 select i, i*1000 from generate_series(1, 100) i;
+analyze aqj_t1;
+analyze aqj_t2;
+analyze aqj_t3;
+-- 1. Two-table INNER JOIN exact match
+create materialized view mv_aqj_join2 as
+  select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_join2;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a order by 1 limit 5;
+ a |  b  
+---+-----
+ 1 | 100
+ 2 | 200
+ 3 | 300
+ 4 | 400
+ 5 | 500
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_join2
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a order by 1 limit 5;
+ a |  b  
+---+-----
+ 1 | 100
+ 2 | 200
+ 3 | 300
+ 4 | 400
+ 5 | 500
+(5 rows)
+
+-- 2. Join with WHERE clause
+create materialized view mv_aqj_where as
+  select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_where;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+               Filter: (a > 5)
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+                     Filter: (a > 5)
+ Optimizer: Postgres query optimizer
+(9 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5 order by 1 limit 5;
+ a  |  b   
+----+------
+  6 |  600
+  7 |  700
+  8 |  800
+  9 |  900
+ 10 | 1000
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_where
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5 order by 1 limit 5;
+ a  |  b   
+----+------
+  6 |  600
+  7 |  700
+  8 |  800
+  9 |  900
+ 10 | 1000
+(5 rows)
+
+-- 3. Join with GROUP BY + aggregate
+create materialized view mv_aqj_agg as
+  select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_agg;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+                   QUERY PLAN                   
+------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  HashAggregate
+         Group Key: aqj_t1.a
+         ->  Hash Join
+               Hash Cond: (aqj_t1.a = aqj_t2.a)
+               ->  Seq Scan on aqj_t1
+               ->  Hash
+                     ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(9 rows)
+
+select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a order by 1 limit 5;
+ a | cnt 
+---+-----
+ 1 |   1
+ 2 |   1
+ 3 |   1
+ 4 |   1
+ 5 |   1
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_agg
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a order by 1 limit 5;
+ a | cnt 
+---+-----
+ 1 |   1
+ 2 |   1
+ 3 |   1
+ 4 |   1
+ 5 |   1
+(5 rows)
+
+-- 4. Non-match: different WHERE clause (should show Hash Join, not MV)
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 10;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+               Filter: (a > 10)
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+                     Filter: (a > 10)
+ Optimizer: Postgres query optimizer
+(9 rows)
+
+-- 5. Non-match: different target list
+explain(costs off) select aqj_t1.b, aqj_t2.a from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+-- 6. Non-match: different join type (INNER vs LEFT)
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 left join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Left Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+-- 7. Three-table join
+create materialized view mv_aqj_join3 as
+  select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_join3;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+                   QUERY PLAN                   
+------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t3.a)
+         ->  Hash Join
+               Hash Cond: (aqj_t1.a = aqj_t2.a)
+               ->  Seq Scan on aqj_t1
+               ->  Hash
+                     ->  Seq Scan on aqj_t2
+         ->  Hash
+               ->  Seq Scan on aqj_t3
+ Optimizer: Postgres query optimizer
+(11 rows)
+
+select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a
+  order by 1 limit 5;
+ a |  b  |  c   
+---+-----+------
+ 1 | 100 | 1000
+ 2 | 200 | 2000
+ 3 | 300 | 3000
+ 4 | 400 | 4000
+ 5 | 500 | 5000
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_join3
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a
+  order by 1 limit 5;
+ a |  b  |  c   
+---+-----+------
+ 1 | 100 | 1000
+ 2 | 200 | 2000
+ 3 | 300 | 3000
+ 4 | 400 | 4000
+ 5 | 500 | 5000
+(5 rows)
+
+-- 8. Implicit join (FROM t1, t2 WHERE ...)
+create materialized view mv_aqj_implicit as
+  select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_implicit;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a order by 1 limit 5;
+ a |  b  
+---+-----
+ 1 | 100
+ 2 | 200
+ 3 | 300
+ 4 | 400
+ 5 | 500
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_implicit
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a order by 1 limit 5;
+ a |  b  
+---+-----
+ 1 | 100
+ 2 | 200
+ 3 | 300
+ 4 | 400
+ 5 | 500
+(5 rows)
+
+-- 9. MV not up-to-date: after INSERT on base table
+insert into aqj_t1 values(999, 9990);
+set enable_answer_query_using_materialized_views = on;
+-- Should NOT use mv_aqj_join2 (status is 'i')
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+-- 10. After REFRESH: should use MV again
+refresh materialized view mv_aqj_join2;
+analyze mv_aqj_join2;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_join2
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+-- 11. GUC off: should NOT use MV
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (aqj_t1.a = aqj_t2.a)
+         ->  Seq Scan on aqj_t1
+         ->  Hash
+               ->  Seq Scan on aqj_t2
+ Optimizer: Postgres query optimizer
+(7 rows)
+
+--
+-- More complex join AQUMV test cases with richer schemas
+--
+create table aqj_orders(
+  order_id int,
+  customer_id int,
+  amount numeric(10,2),
+  status text,
+  order_date date
+) distributed by (order_id);
+create table aqj_customers(
+  customer_id int,
+  name text,
+  region text,
+  credit_limit numeric(10,2)
+) distributed by (customer_id);
+create table aqj_products(
+  product_id int,
+  name text,
+  category text,
+  price numeric(10,2)
+) distributed by (product_id);
+create table aqj_order_items(
+  item_id int,
+  order_id int,
+  product_id int,
+  quantity int
+) distributed by (item_id);
+insert into aqj_customers select i, 'cust_' || i, case when i % 3 = 0 then 'east' when i % 3 = 1 then 'west' else 'north' end, (i * 100)::numeric(10,2) from generate_series(1, 50) i;
+insert into aqj_orders select i, (i % 50) + 1, (i * 10.5)::numeric(10,2), case when i % 4 = 0 then 'shipped' when i % 4 = 1 then 'pending' when i % 4 = 2 then 'delivered' else 'cancelled' end, '2024-01-01'::date + (i % 365) from generate_series(1, 200) i;
+insert into aqj_products select i, 'prod_' || i, case when i % 5 = 0 then 'electronics' when i % 5 = 1 then 'books' when i % 5 = 2 then 'clothing' when i % 5 = 3 then 'food' else 'toys' end, (i * 5.99)::numeric(10,2) from generate_series(1, 30) i;
+insert into aqj_order_items select i, (i % 200) + 1, (i % 30) + 1, (i % 10) + 1 from generate_series(1, 500) i;
+analyze aqj_customers;
+analyze aqj_orders;
+analyze aqj_products;
+analyze aqj_order_items;
+-- 12. Join with multiple columns + WHERE on text column
+create materialized view mv_aqj_orders_cust as
+  select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_orders_cust;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: o.customer_id
+               ->  Seq Scan on aqj_orders o
+                     Filter: (status = 'shipped'::text)
+         ->  Hash
+               ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(10 rows)
+
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+ order_id | amount |  name   | region 
+----------+--------+---------+--------
+        4 |  42.00 | cust_5  | north
+        8 |  84.00 | cust_9  | east
+       12 | 126.00 | cust_13 | west
+       16 | 168.00 | cust_17 | north
+       20 | 210.00 | cust_21 | east
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_orders_cust
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+ order_id | amount |  name   | region 
+----------+--------+---------+--------
+        4 |  42.00 | cust_5  | north
+        8 |  84.00 | cust_9  | east
+       12 | 126.00 | cust_13 | west
+       16 | 168.00 | cust_17 | north
+       20 | 210.00 | cust_21 | east
+(5 rows)
+
+-- 13. Four-table join
+create materialized view mv_aqj_order_details as
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_order_details;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+                                  QUERY PLAN                                  
+------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (oi.product_id = p.product_id)
+         ->  Hash Join
+               Hash Cond: (o.order_id = oi.order_id)
+               ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                     ->  Hash Join
+                           Hash Cond: (o.customer_id = c.customer_id)
+                           ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                                 Hash Key: o.customer_id
+                                 ->  Seq Scan on aqj_orders o
+                           ->  Hash
+                                 ->  Seq Scan on aqj_customers c
+               ->  Hash
+                     ->  Seq Scan on aqj_order_items oi
+         ->  Hash
+               ->  Broadcast Motion 3:3  (slice4; segments: 3)
+                     ->  Seq Scan on aqj_products p
+ Optimizer: Postgres query optimizer
+(19 rows)
+
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+ order_id | customer_name | product_name | quantity | price  
+----------+---------------+--------------+----------+--------
+        1 | cust_2        | prod_11      |        1 |  65.89
+        1 | cust_2        | prod_21      |        1 | 125.79
+        2 | cust_3        | prod_12      |        2 |  71.88
+        2 | cust_3        | prod_2       |        2 |  11.98
+        2 | cust_3        | prod_22      |        2 | 131.78
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_order_details
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+ order_id | customer_name | product_name | quantity | price  
+----------+---------------+--------------+----------+--------
+        1 | cust_2        | prod_11      |        1 |  65.89
+        1 | cust_2        | prod_21      |        1 | 125.79
+        2 | cust_3        | prod_12      |        2 |  71.88
+        2 | cust_3        | prod_2       |        2 |  11.98
+        2 | cust_3        | prod_22      |        2 | 131.78
+(5 rows)
+
+-- 14. GROUP BY on join with multiple aggregates: sum, count, avg
+create materialized view mv_aqj_cust_summary as
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'region' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_cust_summary;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+                                   QUERY PLAN                                    
+---------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Finalize HashAggregate
+         Group Key: c.region
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: c.region
+               ->  Streaming Partial HashAggregate
+                     Group Key: c.region
+                     ->  Hash Join
+                           Hash Cond: (o.customer_id = c.customer_id)
+                           ->  Seq Scan on aqj_orders o
+                           ->  Hash
+                                 ->  Broadcast Motion 3:3  (slice3; segments: 3)
+                                       ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region
+  order by c.region;
+ region | order_count | total_amount |      avg_amount       
+--------+-------------+--------------+-----------------------
+ east   |          64 |     66864.00 | 1044.7500000000000000
+ north  |          68 |     71400.00 | 1050.0000000000000000
+ west   |          68 |     72786.00 | 1070.3823529411764706
+(3 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_cust_summary
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region
+  order by c.region;
+ region | order_count | total_amount |      avg_amount       
+--------+-------------+--------------+-----------------------
+ east   |          64 |     66864.00 | 1044.7500000000000000
+ north  |          68 |     71400.00 | 1050.0000000000000000
+ west   |          68 |     72786.00 | 1070.3823529411764706
+(3 rows)
+
+-- 15. Join with expression in target list (arithmetic + function)
+create materialized view mv_aqj_expr as
+  select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_expr;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+                          QUERY PLAN                           
+---------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Seq Scan on aqj_orders o
+         ->  Hash
+               ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                     ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(8 rows)
+
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+ order_id | amount_with_tax |  name  | region_upper 
+----------+-----------------+--------+--------------
+        1 |          11.550 | cust_2 | NORTH
+        2 |          23.100 | cust_3 | EAST
+        3 |          34.650 | cust_4 | WEST
+        4 |          46.200 | cust_5 | NORTH
+        5 |          57.750 | cust_6 | EAST
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_expr
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+ order_id | amount_with_tax |  name  | region_upper 
+----------+-----------------+--------+--------------
+        1 |          11.550 | cust_2 | NORTH
+        2 |          23.100 | cust_3 | EAST
+        3 |          34.650 | cust_4 | WEST
+        4 |          46.200 | cust_5 | NORTH
+        5 |          57.750 | cust_6 | EAST
+(5 rows)
+
+-- 16. Non-match: same tables + expressions, but extra WHERE (should NOT match mv_aqj_expr)
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where c.region = 'east';
+                          QUERY PLAN                           
+---------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Seq Scan on aqj_orders o
+         ->  Hash
+               ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                     ->  Seq Scan on aqj_customers c
+                           Filter: (region = 'east'::text)
+ Optimizer: Postgres query optimizer
+(9 rows)
+
+-- 17. Non-match: same tables but different aggregate target list
+explain(costs off)
+  select c.region, sum(o.amount) as total_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+                                   QUERY PLAN                                    
+---------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Finalize HashAggregate
+         Group Key: c.region
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: c.region
+               ->  Streaming Partial HashAggregate
+                     Group Key: c.region
+                     ->  Hash Join
+                           Hash Cond: (o.customer_id = c.customer_id)
+                           ->  Seq Scan on aqj_orders o
+                           ->  Hash
+                                 ->  Broadcast Motion 3:3  (slice3; segments: 3)
+                                       ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+-- 18. Non-match: different join order (o JOIN c vs c JOIN o)
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_customers c join aqj_orders o on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: o.customer_id
+               ->  Seq Scan on aqj_orders o
+                     Filter: (status = 'shipped'::text)
+         ->  Hash
+               ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(10 rows)
+
+-- 19. Join with compound WHERE (multiple AND conditions)
+create materialized view mv_aqj_compound_where as
+  select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_compound_where;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+                                   QUERY PLAN                                    
+---------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Seq Scan on aqj_orders o
+               Filter: ((amount > '50'::numeric) AND (status = 'pending'::text))
+         ->  Hash
+               ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                     ->  Seq Scan on aqj_customers c
+                           Filter: (region = 'west'::text)
+ Optimizer: Postgres query optimizer
+(10 rows)
+
+select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50
+  order by o.order_id limit 5;
+ order_id | amount |  name   
+----------+--------+---------
+        9 |  94.50 | cust_10
+       21 | 220.50 | cust_22
+       33 | 346.50 | cust_34
+       45 | 472.50 | cust_46
+       53 | 556.50 | cust_4
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_compound_where
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50
+  order by o.order_id limit 5;
+ order_id | amount |  name   
+----------+--------+---------
+        9 |  94.50 | cust_10
+       21 | 220.50 | cust_22
+       33 | 346.50 | cust_34
+       45 | 472.50 | cust_46
+       53 | 556.50 | cust_4
+(5 rows)
+
+-- 20. Self-join
+create materialized view mv_aqj_selfjoin as
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'id1' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_selfjoin;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+                            QUERY PLAN                            
+------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o1.customer_id = o2.customer_id)
+         Join Filter: (o1.order_id < o2.order_id)
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: o1.customer_id
+               ->  Seq Scan on aqj_orders o1
+         ->  Hash
+               ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                     Hash Key: o2.customer_id
+                     ->  Seq Scan on aqj_orders o2
+ Optimizer: Postgres query optimizer
+(12 rows)
+
+select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id
+  order by o1.order_id, o2.order_id limit 5;
+ id1 | id2 | amt1  |  amt2   
+-----+-----+-------+---------
+   1 |  51 | 10.50 |  535.50
+   1 | 101 | 10.50 | 1060.50
+   1 | 151 | 10.50 | 1585.50
+   2 |  52 | 21.00 |  546.00
+   2 | 102 | 21.00 | 1071.00
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_selfjoin
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id
+  order by o1.order_id, o2.order_id limit 5;
+ id1 | id2 | amt1  |  amt2   
+-----+-----+-------+---------
+   1 |  51 | 10.50 |  535.50
+   1 | 101 | 10.50 | 1060.50
+   1 | 151 | 10.50 | 1585.50
+   2 |  52 | 21.00 |  546.00
+   2 | 102 | 21.00 | 1071.00
+(5 rows)
+
+-- 21. GROUP BY with multi-column key on join
+create materialized view mv_aqj_grp_multi as
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'region, status' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_grp_multi;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+                                   QUERY PLAN                                    
+---------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Finalize HashAggregate
+         Group Key: c.region, o.status
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: c.region, o.status
+               ->  Streaming Partial HashAggregate
+                     Group Key: c.region, o.status
+                     ->  Hash Join
+                           Hash Cond: (o.customer_id = c.customer_id)
+                           ->  Seq Scan on aqj_orders o
+                           ->  Hash
+                                 ->  Broadcast Motion 3:3  (slice3; segments: 3)
+                                       ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+ region |  status   | cnt |  total   
+--------+-----------+-----+----------
+ east   | cancelled |  16 | 16968.00
+ east   | delivered |  16 | 16464.00
+ east   | pending   |  16 | 16968.00
+ east   | shipped   |  16 | 16464.00
+ north  | cancelled |  18 | 19425.00
+ north  | delivered |  16 | 16800.00
+(6 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_grp_multi
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+ region |  status   | cnt |  total   
+--------+-----------+-----+----------
+ east   | cancelled |  16 | 16968.00
+ east   | delivered |  16 | 16464.00
+ east   | pending   |  16 | 16968.00
+ east   | shipped   |  16 | 16464.00
+ north  | cancelled |  18 | 19425.00
+ north  | delivered |  16 | 16800.00
+(6 rows)
+
+-- 22. Four-table join with WHERE and aggregate
+create materialized view mv_aqj_3way_agg as
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'region, category' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_3way_agg;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+                                              QUERY PLAN                                              
+------------------------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Finalize HashAggregate
+         Group Key: c.region, p.category
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: c.region, p.category
+               ->  Streaming Partial HashAggregate
+                     Group Key: c.region, p.category
+                     ->  Hash Join
+                           Hash Cond: (oi.product_id = p.product_id)
+                           ->  Hash Join
+                                 Hash Cond: (oi.order_id = o.order_id)
+                                 ->  Seq Scan on aqj_order_items oi
+                                 ->  Hash
+                                       ->  Broadcast Motion 3:3  (slice3; segments: 3)
+                                             ->  Hash Join
+                                                   Hash Cond: (o.customer_id = c.customer_id)
+                                                   ->  Redistribute Motion 3:3  (slice4; segments: 3)
+                                                         Hash Key: o.customer_id
+                                                         ->  Seq Scan on aqj_orders o
+                                                               Filter: (status = 'delivered'::text)
+                                                   ->  Hash
+                                                         ->  Seq Scan on aqj_customers c
+                           ->  Hash
+                                 ->  Broadcast Motion 3:3  (slice5; segments: 3)
+                                       ->  Seq Scan on aqj_products p
+ Optimizer: Postgres query optimizer
+(26 rows)
+
+select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category
+  order by c.region, p.category limit 6;
+ region |  category   | total_qty | line_count 
+--------+-------------+-----------+------------
+ east   | books       |        30 |          5
+ east   | clothing    |        20 |         10
+ east   | electronics |        50 |          5
+ east   | food        |        80 |         10
+ east   | toys        |        40 |         10
+ north  | books       |        60 |         10
+(6 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_3way_agg
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category
+  order by c.region, p.category limit 6;
+ region |  category   | total_qty | line_count 
+--------+-------------+-----------+------------
+ east   | books       |        30 |          5
+ east   | clothing    |        20 |         10
+ east   | electronics |        50 |          5
+ east   | food        |        80 |         10
+ east   | toys        |        40 |         10
+ north  | books       |        60 |         10
+(6 rows)
+
+-- 23. Implicit four-table join (comma style)
+create materialized view mv_aqj_implicit3 as
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_implicit3;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+                                     QUERY PLAN                                     
+------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (oi.product_id = p.product_id)
+         ->  Hash Join
+               Hash Cond: (oi.order_id = o.order_id)
+               ->  Seq Scan on aqj_order_items oi
+               ->  Hash
+                     ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                           ->  Hash Join
+                                 Hash Cond: (o.customer_id = c.customer_id)
+                                 ->  Redistribute Motion 3:3  (slice3; segments: 3)
+                                       Hash Key: o.customer_id
+                                       ->  Seq Scan on aqj_orders o
+                                             Filter: (status = 'pending'::text)
+                                 ->  Hash
+                                       ->  Seq Scan on aqj_customers c
+         ->  Hash
+               ->  Broadcast Motion 3:3  (slice4; segments: 3)
+                     ->  Seq Scan on aqj_products p
+ Optimizer: Postgres query optimizer
+(20 rows)
+
+select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending'
+  order by o.order_id, p.name limit 5;
+ order_id |  name  | product_name 
+----------+--------+--------------
+        1 | cust_2 | prod_11
+        1 | cust_2 | prod_21
+        5 | cust_6 | prod_15
+        5 | cust_6 | prod_25
+        5 | cust_6 | prod_5
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_implicit3
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending'
+  order by o.order_id, p.name limit 5;
+ order_id |  name  | product_name 
+----------+--------+--------------
+        1 | cust_2 | prod_11
+        1 | cust_2 | prod_21
+        5 | cust_6 | prod_15
+        5 | cust_6 | prod_25
+        5 | cust_6 | prod_5
+(5 rows)
+
+-- 24. Result correctness across DML + REFRESH cycle
+insert into aqj_orders values(201, 1, 9999.99, 'shipped', '2025-12-31');
+set enable_answer_query_using_materialized_views = on;
+-- Stale: should NOT use MV
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Hash Join
+         Hash Cond: (o.customer_id = c.customer_id)
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: o.customer_id
+               ->  Seq Scan on aqj_orders o
+                     Filter: (status = 'shipped'::text)
+         ->  Hash
+               ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(10 rows)
+
+-- Refresh and verify MV is used again
+refresh materialized view mv_aqj_orders_cust;
+analyze mv_aqj_orders_cust;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+                QUERY PLAN                
+------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Seq Scan on mv_aqj_orders_cust
+ Optimizer: Postgres query optimizer
+(3 rows)
+
+-- The new row should appear in results via MV scan
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped' and o.order_id = 201;
+ order_id | amount  |  name  | region 
+----------+---------+--------+--------
+      201 | 9999.99 | cust_1 | west
+(1 row)
+
+-- 25. Post-DML comprehensive: refresh all, then verify GUC off vs on results
+refresh materialized view mv_aqj_order_details;
+refresh materialized view mv_aqj_expr;
+refresh materialized view mv_aqj_selfjoin;
+refresh materialized view mv_aqj_grp_multi;
+refresh materialized view mv_aqj_3way_agg;
+refresh materialized view mv_aqj_implicit3;
+analyze mv_aqj_order_details;
+analyze mv_aqj_expr;
+analyze mv_aqj_selfjoin;
+analyze mv_aqj_grp_multi;
+analyze mv_aqj_3way_agg;
+analyze mv_aqj_implicit3;
+-- Verify four-table join results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+ order_id | customer_name | product_name | quantity | price  
+----------+---------------+--------------+----------+--------
+        1 | cust_2        | prod_11      |        1 |  65.89
+        1 | cust_2        | prod_21      |        1 | 125.79
+        2 | cust_3        | prod_12      |        2 |  71.88
+        2 | cust_3        | prod_2       |        2 |  11.98
+        2 | cust_3        | prod_22      |        2 | 131.78
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+ order_id | customer_name | product_name | quantity | price  
+----------+---------------+--------------+----------+--------
+        1 | cust_2        | prod_11      |        1 |  65.89
+        1 | cust_2        | prod_21      |        1 | 125.79
+        2 | cust_3        | prod_12      |        2 |  71.88
+        2 | cust_3        | prod_2       |        2 |  11.98
+        2 | cust_3        | prod_22      |        2 | 131.78
+(5 rows)
+
+-- Verify expression MV results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+ order_id | amount_with_tax |  name  | region_upper 
+----------+-----------------+--------+--------------
+        1 |          11.550 | cust_2 | NORTH
+        2 |          23.100 | cust_3 | EAST
+        3 |          34.650 | cust_4 | WEST
+        4 |          46.200 | cust_5 | NORTH
+        5 |          57.750 | cust_6 | EAST
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+ order_id | amount_with_tax |  name  | region_upper 
+----------+-----------------+--------+--------------
+        1 |          11.550 | cust_2 | NORTH
+        2 |          23.100 | cust_3 | EAST
+        3 |          34.650 | cust_4 | WEST
+        4 |          46.200 | cust_5 | NORTH
+        5 |          57.750 | cust_6 | EAST
+(5 rows)
+
+-- Verify multi-key GROUP BY results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+ region |  status   | cnt |  total   
+--------+-----------+-----+----------
+ east   | cancelled |  16 | 16968.00
+ east   | delivered |  16 | 16464.00
+ east   | pending   |  16 | 16968.00
+ east   | shipped   |  16 | 16464.00
+ north  | cancelled |  18 | 19425.00
+ north  | delivered |  16 | 16800.00
+(6 rows)
+
+set enable_answer_query_using_materialized_views = on;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+ region |  status   | cnt |  total   
+--------+-----------+-----+----------
+ east   | cancelled |  16 | 16968.00
+ east   | delivered |  16 | 16464.00
+ east   | pending   |  16 | 16968.00
+ east   | shipped   |  16 | 16464.00
+ north  | cancelled |  18 | 19425.00
+ north  | delivered |  16 | 16800.00
+(6 rows)
+
+-- 26. Non-match: LIMIT vs FETCH FIRST WITH TIES (limitOption differs)
+create materialized view mv_aqj_limit_test as
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_limit_test;
+set enable_answer_query_using_materialized_views = on;
+-- Same tables/WHERE/ORDER BY but FETCH FIRST WITH TIES: should NOT match
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id fetch first 5 rows with ties;
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
+ Limit
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Merge Key: o.order_id
+         ->  Limit
+               ->  Sort
+                     Sort Key: o.order_id
+                     ->  Hash Join
+                           Hash Cond: (c.customer_id = o.customer_id)
+                           ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                                 ->  Seq Scan on aqj_customers c
+                           ->  Hash
+                                 ->  Seq Scan on aqj_orders o
+                                       Filter: (status = 'shipped'::text)
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+-- Identical LIMIT query: should match
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+                      QUERY PLAN                       
+-------------------------------------------------------
+ Limit
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Merge Key: order_id
+         ->  Limit
+               ->  Sort
+                     Sort Key: order_id
+                     ->  Seq Scan on mv_aqj_limit_test
+ Optimizer: Postgres query optimizer
+(8 rows)
+
+-- 27. Match: FETCH FIRST WITH TIES exact match
+create materialized view mv_aqj_with_ties as
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'order_id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+analyze mv_aqj_with_ties;
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+                                QUERY PLAN                                 
+---------------------------------------------------------------------------
+ Limit
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Merge Key: o.order_id
+         ->  Limit
+               ->  Sort
+                     Sort Key: o.order_id
+                     ->  Hash Join
+                           Hash Cond: (c.customer_id = o.customer_id)
+                           ->  Broadcast Motion 3:3  (slice2; segments: 3)
+                                 ->  Seq Scan on aqj_customers c
+                           ->  Hash
+                                 ->  Seq Scan on aqj_orders o
+                                       Filter: (status = 'pending'::text)
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+ order_id | amount 
+----------+--------
+        1 |  10.50
+        5 |  52.50
+        9 |  94.50
+       13 | 136.50
+       17 | 178.50
+(5 rows)
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+                      QUERY PLAN                      
+------------------------------------------------------
+ Limit
+   ->  Gather Motion 3:1  (slice1; segments: 3)
+         Merge Key: order_id
+         ->  Limit
+               ->  Sort
+                     Sort Key: order_id
+                     ->  Seq Scan on mv_aqj_with_ties
+ Optimizer: Postgres query optimizer
+(8 rows)
+
+select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+ order_id | amount 
+----------+--------
+        1 |  10.50
+        5 |  52.50
+        9 |  94.50
+       13 | 136.50
+       17 | 178.50
+(5 rows)
+
+-- 28. Non-match: GROUP BY vs GROUP BY DISTINCT (groupDistinct differs)
+-- MV mv_aqj_grp_multi uses GROUP BY (groupDistinct=false, registered in catalog)
+-- Query uses GROUP BY DISTINCT — should NOT match
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by distinct c.region, o.status;
+                                   QUERY PLAN                                    
+---------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Finalize HashAggregate
+         Group Key: c.region, o.status
+         ->  Redistribute Motion 3:3  (slice2; segments: 3)
+               Hash Key: c.region, o.status
+               ->  Streaming Partial HashAggregate
+                     Group Key: c.region, o.status
+                     ->  Hash Join
+                           Hash Cond: (o.customer_id = c.customer_id)
+                           ->  Seq Scan on aqj_orders o
+                           ->  Hash
+                                 ->  Broadcast Motion 3:3  (slice3; segments: 3)
+                                       ->  Seq Scan on aqj_customers c
+ Optimizer: Postgres query optimizer
+(14 rows)
+
+-- Clean up AQUMV join test objects
+drop materialized view mv_aqj_with_ties;
+drop materialized view mv_aqj_limit_test;
+drop materialized view mv_aqj_implicit3;
+drop materialized view mv_aqj_3way_agg;
+drop materialized view mv_aqj_grp_multi;
+drop materialized view mv_aqj_selfjoin;
+drop materialized view mv_aqj_compound_where;
+drop materialized view mv_aqj_expr;
+drop materialized view mv_aqj_cust_summary;
+drop materialized view mv_aqj_order_details;
+drop materialized view mv_aqj_orders_cust;
+drop materialized view mv_aqj_implicit;
+drop materialized view mv_aqj_join3;
+drop materialized view mv_aqj_agg;
+drop materialized view mv_aqj_where;
+drop materialized view mv_aqj_join2;
+drop table aqj_order_items;
+drop table aqj_products;
+drop table aqj_customers;
+drop table aqj_orders;
+drop table aqj_t3;
+drop table aqj_t2;
+drop table aqj_t1;
 -- test drop table
 select mvname, datastatus from gp_matview_aux where mvname in ('mv0','mv1', 'mv2', 'mv3');
  mvname | datastatus 
@@ -925,12 +2350,12 @@ HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sur
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 insert into par_1_prt_1 values (1, 1, 1);
@@ -938,9 +2363,9 @@ insert into par_1_prt_1 values (1, 1, 1);
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
+ mv_par1_2 | u
  mv_par2   | u
  mv_par2_1 | u
- mv_par1_2 | u
  mv_par1_1 | i
  mv_par1   | i
  mv_par    | i
@@ -951,12 +2376,12 @@ insert into par values (1, 2, 2);
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | i
- mv_par2_1 | u
  mv_par1_2 | u
+ mv_par2_1 | u
  mv_par1_1 | i
  mv_par1   | i
  mv_par    | i
+ mv_par2   | i
 (6 rows)
 
 refresh materialized view mv_par;
@@ -971,11 +2396,11 @@ insert into par_1_prt_2_2_prt_1 values (1, 2, 1);
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | i
- mv_par2_1 | i
  mv_par1_2 | u
  mv_par1   | u
  mv_par1_1 | u
+ mv_par2_1 | i
+ mv_par2   | i
  mv_par    | i
 (6 rows)
 
@@ -986,11 +2411,11 @@ truncate par_1_prt_2;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | e
- mv_par2_1 | e
  mv_par1_2 | u
  mv_par1   | u
  mv_par1_1 | u
+ mv_par2_1 | e
+ mv_par2   | e
  mv_par    | e
 (6 rows)
 
@@ -1000,11 +2425,11 @@ truncate par_1_prt_2;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | e
- mv_par2_1 | e
  mv_par1_2 | u
  mv_par1   | u
  mv_par1_1 | u
+ mv_par2_1 | e
+ mv_par2   | e
  mv_par    | e
 (6 rows)
 
@@ -1018,9 +2443,9 @@ vacuum full par_1_prt_1_2_prt_1;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
+ mv_par1_2 | u
  mv_par2   | u
  mv_par2_1 | u
- mv_par1_2 | u
  mv_par1_1 | r
  mv_par1   | r
  mv_par    | r
@@ -1038,8 +2463,8 @@ select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
  mv_par2   | r
- mv_par2_1 | r
  mv_par    | r
+ mv_par2_1 | r
  mv_par1_2 | r
  mv_par1   | r
  mv_par1_1 | r
@@ -1058,10 +2483,10 @@ NOTICE:  table has parent, setting distribution columns to match parent table
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
  mv_par1   | e
  mv_par    | e
 (6 rows)
@@ -1089,10 +2514,10 @@ alter table par_1_prt_1 detach partition par_1_prt_1_2_prt_1;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
  mv_par1   | e
  mv_par    | e
 (6 rows)
@@ -1107,10 +2532,10 @@ alter table par_1_prt_1 attach partition new_par for values from (4) to (5);
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
  mv_par1   | e
  mv_par    | e
 (6 rows)
@@ -1130,12 +2555,12 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 insert into par values(1, 1, 1), (1, 1, 2);
@@ -1144,10 +2569,10 @@ select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
 -----------+------------
  mv_par2   | u
  mv_par2_1 | u
- mv_par1_1 | i
+ mv_par1_2 | i
  mv_par1   | i
  mv_par    | i
- mv_par1_2 | i
+ mv_par1_1 | i
 (6 rows)
 
 abort;
@@ -1155,23 +2580,23 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 insert into par_1_prt_2_2_prt_1 values(2, 2, 1);
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | i
- mv_par2_1 | i
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2_1 | i
+ mv_par2   | i
  mv_par    | i
 (6 rows)
 
@@ -1180,23 +2605,23 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 delete from par where b = 2  and c = 1;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | e
- mv_par2_1 | e
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2_1 | e
+ mv_par2   | e
  mv_par    | e
 (6 rows)
 
@@ -1205,21 +2630,21 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 delete from par_1_prt_1_2_prt_2;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
+ mv_par1_1 | u
  mv_par2   | u
  mv_par2_1 | u
- mv_par1_1 | u
  mv_par1_2 | e
  mv_par1   | e
  mv_par    | e
@@ -1231,12 +2656,12 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 update par set c = 2 where b = 1 and c = 1;
@@ -1257,12 +2682,12 @@ begin;
 select mvname, datastatus from gp_matview_aux where mvname like 'mv_par%';
   mvname   | datastatus 
 -----------+------------
- mv_par2   | u
- mv_par2_1 | u
  mv_par    | u
  mv_par1   | u
  mv_par1_1 | u
  mv_par1_2 | u
+ mv_par2   | u
+ mv_par2_1 | u
 (6 rows)
 
 update par set c = 2, a = 2 where  b = 1 and c = 1;
@@ -1281,6 +2706,7 @@ abort;
 -- Test report warning if extend protocol data is not consumed.
 --start_ignore
 drop extension gp_inject_fault;
+ERROR:  extension "gp_inject_fault" does not exist
 create extension gp_inject_fault;
 --end_ignore
 select gp_inject_fault_infinite('consume_extend_protocol_data', 'skip', dbid)
diff --git a/src/test/regress/expected/orca_parallel.out b/src/test/regress/expected/orca_parallel.out
new file mode 100644
index 00000000000..73df0c060bd
--- /dev/null
+++ b/src/test/regress/expected/orca_parallel.out
@@ -0,0 +1,120 @@
+create schema orca_parallel;
+set search_path=orca_parallel, public;
+set statement_mem = '256MB';
+set optimizer=on;
+create table t1(a int, b int) with(parallel_workers=2) distributed by (a);
+create table t2(c int, d int ) with(parallel_workers=3) distributed by (c);
+insert into t1 select i, i+1 from generate_series(1, 1000)i;
+insert into t2 select i, i+2 from generate_series(1, 20000)i;
+analyze t1;
+analyze t2;
+set parallel_setup_cost=0;
+set max_parallel_workers_per_gather=4;
+set enable_parallel = on;
+explain (verbose, costs off) select * from t1  join t2  on t1.a = t2.c;
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Output: t1.a, t1.b, t2.c, t2.d
+   ->  Hash Join
+         Output: t1.a, t1.b, t2.c, t2.d
+         Hash Cond: (t2.c = t1.a)
+         ->  Redistribute Motion 9:3  (slice2; segments: 9)
+               Output: t2.c, t2.d
+               Hash Key: t2.c
+               ->  Parallel Seq Scan on orca_parallel.t2
+                     Output: t2.c, t2.d
+         ->  Hash
+               Output: t1.a, t1.b
+               ->  Redistribute Motion 6:3  (slice3; segments: 6)
+                     Output: t1.a, t1.b
+                     Hash Key: t1.a
+                     ->  Parallel Seq Scan on orca_parallel.t1
+                           Output: t1.a, t1.b
+ Settings: enable_parallel = 'on', optimizer = 'on', parallel_setup_cost = '0'
+ Optimizer: GPORCA
+(19 rows)
+
+explain (verbose, costs off) select * from t1  join t2  on t1.a = t2.d;
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Output: t1.a, t1.b, t2.c, t2.d
+   ->  Hash Join
+         Output: t1.a, t1.b, t2.c, t2.d
+         Hash Cond: (t2.d = t1.a)
+         ->  Redistribute Motion 9:3  (slice2; segments: 9)
+               Output: t2.c, t2.d
+               Hash Key: t2.d
+               ->  Parallel Seq Scan on orca_parallel.t2
+                     Output: t2.c, t2.d
+         ->  Hash
+               Output: t1.a, t1.b
+               ->  Redistribute Motion 6:3  (slice3; segments: 6)
+                     Output: t1.a, t1.b
+                     Hash Key: t1.a
+                     ->  Parallel Seq Scan on orca_parallel.t1
+                           Output: t1.a, t1.b
+ Settings: enable_parallel = 'on', optimizer = 'on', parallel_setup_cost = '0'
+ Optimizer: GPORCA
+(19 rows)
+
+explain (verbose, costs off) select * from t1  join t2  on t1.b = t2.c;
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Output: t1.a, t1.b, t2.c, t2.d
+   ->  Hash Join
+         Output: t1.a, t1.b, t2.c, t2.d
+         Hash Cond: (t2.c = t1.b)
+         ->  Redistribute Motion 9:3  (slice2; segments: 9)
+               Output: t2.c, t2.d
+               Hash Key: t2.c
+               ->  Parallel Seq Scan on orca_parallel.t2
+                     Output: t2.c, t2.d
+         ->  Hash
+               Output: t1.a, t1.b
+               ->  Redistribute Motion 6:3  (slice3; segments: 6)
+                     Output: t1.a, t1.b
+                     Hash Key: t1.b
+                     ->  Parallel Seq Scan on orca_parallel.t1
+                           Output: t1.a, t1.b
+ Settings: enable_parallel = 'on', optimizer = 'on', parallel_setup_cost = '0'
+ Optimizer: GPORCA
+(19 rows)
+
+explain (verbose, costs off) select * from t1  join t2  on t1.b = t2.d;
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   Output: t1.a, t1.b, t2.c, t2.d
+   ->  Hash Join
+         Output: t1.a, t1.b, t2.c, t2.d
+         Hash Cond: (t2.d = t1.b)
+         ->  Redistribute Motion 9:3  (slice2; segments: 9)
+               Output: t2.c, t2.d
+               Hash Key: t2.d
+               ->  Parallel Seq Scan on orca_parallel.t2
+                     Output: t2.c, t2.d
+         ->  Hash
+               Output: t1.a, t1.b
+               ->  Redistribute Motion 6:3  (slice3; segments: 6)
+                     Output: t1.a, t1.b
+                     Hash Key: t1.b
+                     ->  Parallel Seq Scan on orca_parallel.t1
+                           Output: t1.a, t1.b
+ Settings: enable_parallel = 'on', optimizer = 'on', parallel_setup_cost = '0'
+ Optimizer: GPORCA
+(19 rows)
+
+reset enable_parallel;
+reset max_parallel_workers_per_gather;
+reset parallel_setup_cost;
+reset statement_mem;
+reset optimizer;
+-- start_ignore
+drop schema orca_parallel cascade;
+NOTICE:  drop cascades to 2 other objects
+DETAIL:  drop cascades to table t1
+drop cascades to table t2
+-- end_ignore
diff --git a/src/test/regress/expected/pg_stat.out b/src/test/regress/expected/pg_stat.out
index 80e4e4ff132..8c2b2e81d32 100644
--- a/src/test/regress/expected/pg_stat.out
+++ b/src/test/regress/expected/pg_stat.out
@@ -5,7 +5,7 @@ create table pg_stat_test(a int);
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup
-from pg_stat_all_tables where relname = 'pg_stat_test';
+from gp_stat_all_tables_summary where relname = 'pg_stat_test';
  schemaname |   relname    | seq_scan | seq_tup_read | idx_scan | idx_tup_fetch | n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup 
 ------------+--------------+----------+--------------+----------+---------------+-----------+-----------+-----------+---------------+------------+------------
  public     | pg_stat_test |        0 |            0 |          |               |         0 |         0 |         0 |             0 |          0 |          0
@@ -14,7 +14,7 @@ from pg_stat_all_tables where relname = 'pg_stat_test';
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup
-from pg_stat_user_tables where relname = 'pg_stat_test';
+from gp_stat_user_tables_summary where relname = 'pg_stat_test';
  schemaname |   relname    | seq_scan | seq_tup_read | idx_scan | idx_tup_fetch | n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup 
 ------------+--------------+----------+--------------+----------+---------------+-----------+-----------+-----------+---------------+------------+------------
  public     | pg_stat_test |        0 |            0 |          |               |         0 |         0 |         0 |             0 |          0 |          0
@@ -22,14 +22,14 @@ from pg_stat_user_tables where relname = 'pg_stat_test';
 
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_all_indexes where relname = 'pg_stat_test';
+from gp_stat_all_indexes_summary where relname = 'pg_stat_test';
  schemaname | relname | indexrelname | idx_scan | idx_tup_read | idx_tup_fetch 
 ------------+---------+--------------+----------+--------------+---------------
 (0 rows)
 
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_user_indexes where relname = 'pg_stat_test';
+from gp_stat_user_indexes_summary where relname = 'pg_stat_test';
  schemaname | relname | indexrelname | idx_scan | idx_tup_read | idx_tup_fetch 
 ------------+---------+--------------+----------+--------------+---------------
 (0 rows)
@@ -63,7 +63,7 @@ reset enable_seqscan;
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze
-from pg_stat_all_tables where relname = 'pg_stat_test';
+from gp_stat_all_tables_summary where relname = 'pg_stat_test';
  schemaname |   relname    | seq_scan | seq_tup_read | idx_scan | idx_tup_fetch | n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 ------------+--------------+----------+--------------+----------+---------------+-----------+-----------+-----------+---------------+------------+------------+---------------------
  public     | pg_stat_test |       12 |          391 |        1 |             0 |       110 |         0 |        19 |             0 |         91 |         19 |                 129
@@ -72,7 +72,7 @@ from pg_stat_all_tables where relname = 'pg_stat_test';
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze
-from pg_stat_user_tables where relname = 'pg_stat_test';
+from gp_stat_user_tables_summary where relname = 'pg_stat_test';
  schemaname |   relname    | seq_scan | seq_tup_read | idx_scan | idx_tup_fetch | n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 ------------+--------------+----------+--------------+----------+---------------+-----------+-----------+-----------+---------------+------------+------------+---------------------
  public     | pg_stat_test |       12 |          391 |        1 |             0 |       110 |         0 |        19 |             0 |         91 |         19 |                 129
@@ -80,7 +80,7 @@ from pg_stat_user_tables where relname = 'pg_stat_test';
 
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_all_indexes where relname = 'pg_stat_test';
+from gp_stat_all_indexes_summary where relname = 'pg_stat_test';
  schemaname |   relname    |       indexrelname       | idx_scan | idx_tup_read | idx_tup_fetch 
 ------------+--------------+--------------------------+----------+--------------+---------------
  public     | pg_stat_test | pg_stat_user_table_index |        1 |            1 |             0
@@ -88,7 +88,7 @@ from pg_stat_all_indexes where relname = 'pg_stat_test';
 
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_user_indexes where relname = 'pg_stat_test';
+from gp_stat_user_indexes_summary where relname = 'pg_stat_test';
  schemaname |   relname    |       indexrelname       | idx_scan | idx_tup_read | idx_tup_fetch 
 ------------+--------------+--------------------------+----------+--------------+---------------
  public     | pg_stat_test | pg_stat_user_table_index |        1 |            1 |             0
diff --git a/src/test/regress/expected/qp_orca_fallback.out b/src/test/regress/expected/qp_orca_fallback.out
index 37378ef698f..e8e42370758 100644
--- a/src/test/regress/expected/qp_orca_fallback.out
+++ b/src/test/regress/expected/qp_orca_fallback.out
@@ -293,6 +293,92 @@ SELECT * FROM jsonb_array_elements('["b", "a"]'::jsonb) WITH ORDINALITY;
  "a"   |          2
 (2 rows)
 
+-- The walker that detects a CTE Consumer on a different slice than its
+-- replicated Producer. Without it ORCA would emit a plan with cross-slice
+-- replicated CTE Consumers that hangs at execution.
+-- start_ignore
+DROP TABLE IF EXISTS tbl1, tbl2;
+NOTICE:  table "tbl1" does not exist, skipping
+NOTICE:  table "tbl2" does not exist, skipping
+-- end_ignore
+CREATE TABLE tbl2 (id numeric, refrcode varchar(255), referenceid numeric)
+DISTRIBUTED REPLICATED;
+CREATE TABLE tbl1 (id bigserial, iscalctrg varchar(15) NOT NULL,
+                   iscalcdetail varchar(15))
+DISTRIBUTED REPLICATED;
+-- start_ignore
+INSERT INTO tbl2 SELECT i, 'A'||(i%5), 101991
+  FROM generate_series(1, 50000) i;
+INSERT INTO tbl1 (iscalctrg, iscalcdetail)
+  SELECT 'A'||(i%5), 'A'||(i%7) FROM generate_series(1, 50000) i;
+ANALYZE tbl1;
+ANALYZE tbl2;
+-- end_ignore
+-- Case 1: walker triggers fallback. With scalar subqueries on the CTE
+-- ORCA produces a plan whose CTE Producer is replicated and Consumers
+-- live on a different slice -- the walker raises ExmiExpr2DXLUnsupported
+-- and trace_fallback DETAIL says "CTE Consumer placed on a different
+-- slice than its replicated Producer".
+EXPLAIN (COSTS OFF)
+WITH t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.iscalctrg,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalctrg    LIMIT 1) AS r,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalcdetail LIMIT 1) AS r1
+FROM tbl1 p
+LIMIT 1;
+                                       QUERY PLAN
+----------------------------------------------------------------------------------------
+ Gather Motion 1:1  (slice1; segments: 1)
+   ->  Limit
+         ->  Seq Scan on tbl1 p
+               SubPlan 1
+                 ->  Limit
+                       ->  Result
+                             Filter: ((tbl2.refrcode)::text = (p.iscalctrg)::text)
+                             ->  Materialize
+                                   ->  Seq Scan on tbl2
+                                         Filter: (referenceid = '101991'::numeric)
+               SubPlan 2
+                 ->  Limit
+                       ->  Result
+                             Filter: ((tbl2_1.refrcode)::text = (p.iscalcdetail)::text)
+                             ->  Materialize
+                                   ->  Seq Scan on tbl2 tbl2_1
+                                         Filter: (referenceid = '101991'::numeric)
+ Optimizer: Postgres query optimizer
+(18 rows)
+
+-- Case 2: walker correctly stays silent. The same CTE referenced from a
+-- JOIN: ORCA pins the Producer body to a single segment with a One-Time
+-- Filter (gp_execution_segment() = N), so the Producer's child
+-- distribution is EdtSingleton, not replicated -- the walker skips it.
+EXPLAIN (COSTS OFF)
+WITH t1 AS (SELECT * FROM tbl1),
+     t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.* FROM t1 p
+  JOIN t2 r  ON p.iscalctrg   = r.refrcode
+  JOIN t2 r1 ON p.iscalcdetail = r1.refrcode
+LIMIT 1;
+                                   QUERY PLAN
+---------------------------------------------------------------------------------
+ Gather Motion 1:1  (slice1; segments: 1)
+   ->  Limit
+         ->  Hash Join
+               Hash Cond: ((tbl1.iscalcdetail)::text = (r1.refrcode)::text)
+               ->  Hash Join
+                     Hash Cond: ((tbl2.refrcode)::text = (tbl1.iscalctrg)::text)
+                     ->  Seq Scan on tbl2
+                           Filter: (referenceid = '101991'::numeric)
+                     ->  Hash
+                           ->  Seq Scan on tbl1
+               ->  Hash
+                     ->  Subquery Scan on r1
+                           ->  Seq Scan on tbl2 tbl2_1
+                                 Filter: (referenceid = '101991'::numeric)
+ Optimizer: Postgres query optimizer
+(15 rows)
+
+DROP TABLE tbl1, tbl2;
 -- start_ignore
 -- FIXME: gpcheckcat fails due to mismatching distribution policy if this table isn't dropped
 -- Keep this table around once this is fixed
diff --git a/src/test/regress/expected/qp_orca_fallback_optimizer.out b/src/test/regress/expected/qp_orca_fallback_optimizer.out
index ad2eeabd1e5..63c2cc0e1a8 100644
--- a/src/test/regress/expected/qp_orca_fallback_optimizer.out
+++ b/src/test/regress/expected/qp_orca_fallback_optimizer.out
@@ -353,6 +353,105 @@ DETAIL:  Falling back to Postgres-based planner because GPORCA does not support
  "a"   |          2
 (2 rows)
 
+-- The walker that detects a CTE Consumer on a different slice than its
+-- replicated Producer. Without it ORCA would emit a plan with cross-slice
+-- replicated CTE Consumers that hangs at execution.
+-- start_ignore
+DROP TABLE IF EXISTS tbl1, tbl2;
+NOTICE:  table "tbl1" does not exist, skipping
+NOTICE:  table "tbl2" does not exist, skipping
+-- end_ignore
+CREATE TABLE tbl2 (id numeric, refrcode varchar(255), referenceid numeric)
+DISTRIBUTED REPLICATED;
+CREATE TABLE tbl1 (id bigserial, iscalctrg varchar(15) NOT NULL,
+                   iscalcdetail varchar(15))
+DISTRIBUTED REPLICATED;
+-- start_ignore
+INSERT INTO tbl2 SELECT i, 'A'||(i%5), 101991
+  FROM generate_series(1, 50000) i;
+INSERT INTO tbl1 (iscalctrg, iscalcdetail)
+  SELECT 'A'||(i%5), 'A'||(i%7) FROM generate_series(1, 50000) i;
+ANALYZE tbl1;
+ANALYZE tbl2;
+-- end_ignore
+-- Case 1: walker triggers fallback. With scalar subqueries on the CTE
+-- ORCA produces a plan whose CTE Producer is replicated and Consumers
+-- live on a different slice -- the walker raises ExmiExpr2DXLUnsupported
+-- and trace_fallback DETAIL says "CTE Consumer placed on a different
+-- slice than its replicated Producer".
+EXPLAIN (COSTS OFF)
+WITH t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.iscalctrg,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalctrg    LIMIT 1) AS r,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalcdetail LIMIT 1) AS r1
+FROM tbl1 p
+LIMIT 1;
+INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
+DETAIL:  Falling back to Postgres-based planner because GPORCA does not support the following feature: CTE Consumer placed on a different slice than its replicated Producer
+                                       QUERY PLAN
+----------------------------------------------------------------------------------------
+ Gather Motion 1:1  (slice1; segments: 1)
+   ->  Limit
+         ->  Seq Scan on tbl1 p
+               SubPlan 1
+                 ->  Limit
+                       ->  Result
+                             Filter: ((tbl2.refrcode)::text = (p.iscalctrg)::text)
+                             ->  Materialize
+                                   ->  Seq Scan on tbl2
+                                         Filter: (referenceid = '101991'::numeric)
+               SubPlan 2
+                 ->  Limit
+                       ->  Result
+                             Filter: ((tbl2_1.refrcode)::text = (p.iscalcdetail)::text)
+                             ->  Materialize
+                                   ->  Seq Scan on tbl2 tbl2_1
+                                         Filter: (referenceid = '101991'::numeric)
+ Optimizer: Postgres query optimizer
+(18 rows)
+
+-- Case 2: walker correctly stays silent. The same CTE referenced from a
+-- JOIN: ORCA pins the Producer body to a single segment with a One-Time
+-- Filter (gp_execution_segment() = N), so the Producer's child
+-- distribution is EdtSingleton, not replicated -- the walker skips it.
+EXPLAIN (COSTS OFF)
+WITH t1 AS (SELECT * FROM tbl1),
+     t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.* FROM t1 p
+  JOIN t2 r  ON p.iscalctrg   = r.refrcode
+  JOIN t2 r1 ON p.iscalcdetail = r1.refrcode
+LIMIT 1;
+                                                    QUERY PLAN
+-------------------------------------------------------------------------------------------------------------------
+ Gather Motion 3:1  (slice1; segments: 3)
+   ->  Sequence
+         ->  Shared Scan (share slice:id 1:1)
+               ->  Result
+                     Filter: (tbl2.referenceid = '101991'::numeric)
+                     ->  Result
+                           One-Time Filter: (gp_execution_segment() = 1)
+                           ->  Seq Scan on tbl2
+         ->  Redistribute Motion 1:3  (slice2)
+               ->  Limit
+                     ->  Gather Motion 3:1  (slice3; segments: 3)
+                           ->  Limit
+                                 ->  Hash Join
+                                       Hash Cond: ((tbl1.iscalctrg)::text = (share1_ref2.refrcode)::text)
+                                       ->  Hash Join
+                                             Hash Cond: ((tbl1.iscalcdetail)::text = (share1_ref3.refrcode)::text)
+                                             ->  Result
+                                                   ->  Seq Scan on tbl1
+                                             ->  Hash
+                                                   ->  Redistribute Motion 3:3  (slice4; segments: 3)
+                                                         Hash Key: share1_ref3.refrcode
+                                                         ->  Shared Scan (share slice:id 4:1)
+                                       ->  Hash
+                                             ->  Broadcast Motion 3:3  (slice5; segments: 3)
+                                                   ->  Shared Scan (share slice:id 5:1)
+ Optimizer: GPORCA
+(26 rows)
+
+DROP TABLE tbl1, tbl2;
 -- start_ignore
 -- FIXME: gpcheckcat fails due to mismatching distribution policy if this table isn't dropped
 -- Keep this table around once this is fixed
diff --git a/src/test/regress/expected/rpt_optimizer.out b/src/test/regress/expected/rpt_optimizer.out
index 24ee61ff642..a07e2c8f8dc 100644
--- a/src/test/regress/expected/rpt_optimizer.out
+++ b/src/test/regress/expected/rpt_optimizer.out
@@ -933,16 +933,17 @@ explain (costs off) select a from t_replicate_volatile union all select * from n
 
 -- CTAS
 explain (costs off) create table rpt_ctas as select random() from generate_series(1, 10) distributed replicated;
-QUERY PLAN
-___________
+                  QUERY PLAN                  
+----------------------------------------------
  Result
    ->  Broadcast Motion 1:3  (slice1)
          ->  Function Scan on generate_series
-GP_IGNORE:(4 rows)
+ Optimizer: GPORCA
+(4 rows)
 
 explain (costs off) create table rpt_ctas as select a from generate_series(1, 10) a group by a having sum(a) > random() distributed replicated;
-QUERY PLAN
-___________
+                                  QUERY PLAN                                   
+-------------------------------------------------------------------------------
  Result
    ->  Broadcast Motion 3:3  (slice1; segments: 3)
          ->  Result
@@ -951,8 +952,8 @@ ___________
                      Group Key: generate_series
                      ->  Result
                            ->  Function Scan on generate_series
- Optimizer: Pivotal Optimizer (GPORCA)
-GP_IGNORE:(9 rows)
+ Optimizer: GPORCA
+(9 rows)
 
 -- update & delete
 explain (costs off) update t_replicate_volatile set a = 1 where b > random();
diff --git a/src/test/regress/expected/shared_scan.out b/src/test/regress/expected/shared_scan.out
index 2673aff0f8c..83a3815fb0e 100644
--- a/src/test/regress/expected/shared_scan.out
+++ b/src/test/regress/expected/shared_scan.out
@@ -234,3 +234,36 @@ where
  Optimizer: Postgres query optimizer
 (37 rows)
 
+-- ORCA should fallback when a CTE over a replicated table is referenced
+-- from multiple scalar subqueries.
+-- ss_t1 needs enough rows (40000) to push ORCA to the cross-slice plan;
+-- with fewer rows the bug does not manifest and the test would silently
+-- pass even without the fix.
+-- start_ignore
+DROP TABLE IF EXISTS ss_t1, ss_t2;
+NOTICE:  table "ss_t1" does not exist, skipping
+NOTICE:  table "ss_t2" does not exist, skipping
+-- end_ignore
+CREATE TABLE ss_t1 AS
+  SELECT generate_series(1, 40000) id
+  DISTRIBUTED BY (id);
+CREATE TABLE ss_t2 AS
+  SELECT * FROM (VALUES (1, 10), (2, 20)) AS v(id, v)
+  DISTRIBUTED REPLICATED;
+ANALYZE ss_t1;
+ANALYZE ss_t2;
+SET statement_timeout = '15s';
+WITH
+    cte1 AS (SELECT v FROM ss_t2 WHERE id = 1),
+    cte2 AS (SELECT v FROM ss_t2 WHERE id = 2)
+  SELECT (SELECT v FROM cte1) + (SELECT v FROM cte2) +
+         (SELECT v FROM cte1) + (SELECT v FROM cte2) AS result
+  FROM ss_t1
+  LIMIT 1;
+ result 
+--------
+     60
+(1 row)
+
+RESET statement_timeout;
+DROP TABLE ss_t1, ss_t2;
diff --git a/src/test/regress/expected/shared_scan_optimizer.out b/src/test/regress/expected/shared_scan_optimizer.out
index 57ec36089d2..e71dfafe035 100644
--- a/src/test/regress/expected/shared_scan_optimizer.out
+++ b/src/test/regress/expected/shared_scan_optimizer.out
@@ -242,3 +242,31 @@ where
  Optimizer: Postgres query optimizer
 (37 rows)
 
+-- ORCA should fallback when a CTE over a replicated table is referenced
+-- from multiple scalar subqueries.
+-- ss_t1 needs enough rows (40000) to push ORCA to the cross-slice plan;
+-- with fewer rows the bug does not manifest and the test would silently
+-- pass even without the fix.
+CREATE TABLE ss_t1 AS
+  SELECT generate_series(1, 40000) id
+  DISTRIBUTED BY (id);
+CREATE TABLE ss_t2 AS
+  SELECT * FROM (VALUES (1, 10), (2, 20)) AS v(id, v)
+  DISTRIBUTED REPLICATED;
+ANALYZE ss_t1;
+ANALYZE ss_t2;
+SET statement_timeout = '15s';
+WITH
+    cte1 AS (SELECT v FROM ss_t2 WHERE id = 1),
+    cte2 AS (SELECT v FROM ss_t2 WHERE id = 2)
+  SELECT (SELECT v FROM cte1) + (SELECT v FROM cte2) +
+         (SELECT v FROM cte1) + (SELECT v FROM cte2) AS result
+  FROM ss_t1
+  LIMIT 1;
+ result 
+--------
+     60
+(1 row)
+
+RESET statement_timeout;
+DROP TABLE ss_t1, ss_t2;
diff --git a/src/test/regress/expected/tuplesort.out b/src/test/regress/expected/tuplesort.out
index 47b5a8ddb21..e6cd26efdb1 100644
--- a/src/test/regress/expected/tuplesort.out
+++ b/src/test/regress/expected/tuplesort.out
@@ -236,7 +236,7 @@ CLUSTER abbrev_abort_uuids USING abbrev_abort_uuids__abort_increasing_idx;
 -- head
 SELECT id, abort_increasing, abort_decreasing, noabort_increasing, noabort_decreasing
 FROM abbrev_abort_uuids
-ORDER BY ctid LIMIT 5;
+ORDER BY ctid, id LIMIT 5;
  id |           abort_increasing           |           abort_decreasing           |          noabort_increasing          |          noabort_decreasing          
 ----+--------------------------------------+--------------------------------------+--------------------------------------+--------------------------------------
   2 | 00000000-0000-0000-0000-000000000001 | 00000000-0000-0000-0000-000000019999 | 00000001-0000-0000-0000-000000000001 | 00009990-0000-0000-0000-000000019999
diff --git a/src/test/regress/expected/tuplesort_optimizer.out b/src/test/regress/expected/tuplesort_optimizer.out
index d62e0a0e71b..4eaabea61b5 100644
--- a/src/test/regress/expected/tuplesort_optimizer.out
+++ b/src/test/regress/expected/tuplesort_optimizer.out
@@ -232,7 +232,7 @@ CLUSTER abbrev_abort_uuids USING abbrev_abort_uuids__abort_increasing_idx;
 -- head
 SELECT id, abort_increasing, abort_decreasing, noabort_increasing, noabort_decreasing
 FROM abbrev_abort_uuids
-ORDER BY ctid LIMIT 5;
+ORDER BY ctid, id LIMIT 5;
  id |           abort_increasing           |           abort_decreasing           |          noabort_increasing          |          noabort_decreasing          
 ----+--------------------------------------+--------------------------------------+--------------------------------------+--------------------------------------
   2 | 00000000-0000-0000-0000-000000000001 | 00000000-0000-0000-0000-000000019999 | 00000001-0000-0000-0000-000000000001 | 00009990-0000-0000-0000-000000019999
diff --git a/src/test/regress/expected/union_gp.out b/src/test/regress/expected/union_gp.out
index 5bdae3e887c..d134f223502 100644
--- a/src/test/regress/expected/union_gp.out
+++ b/src/test/regress/expected/union_gp.out
@@ -2342,6 +2342,36 @@ with result as (update r_1240 set a = a +1 where a < 5 returning *) select * fro
 drop table r_1240;
 drop table p1_1240;
 --
+-- Test CTAS with UNION ALL when branches have different typmods (issue #1431).
+-- ORCA should resolve the output column type to character varying (no length),
+-- same as the Postgres planner, instead of picking the first branch's typmod.
+--
+create table union_ctas_t1(id int, name varchar(1));
+create table union_ctas_t2(id int, name varchar(2));
+insert into union_ctas_t1 values (1, 'a');
+insert into union_ctas_t2 values (1, 'ab');
+create table union_ctas_result as
+  (select id, name from union_ctas_t1)
+  union all
+  (select id, name from union_ctas_t2);
+-- name column should be "character varying" without length, not varchar(1)
+select atttypmod from pg_attribute
+where attrelid = 'union_ctas_result'::regclass and attname = 'name';
+ atttypmod 
+-----------
+        -1
+(1 row)
+
+-- data should not be truncated
+select * from union_ctas_result order by name;
+ id | name 
+----+------
+  1 | a
+  1 | ab
+(2 rows)
+
+drop table union_ctas_t1, union_ctas_t2, union_ctas_result;
+--
 -- Clean up
 --
 DROP TABLE IF EXISTS T_a1 CASCADE;
diff --git a/src/test/regress/expected/union_gp_optimizer.out b/src/test/regress/expected/union_gp_optimizer.out
index 8ff8655591d..8704f0fe7a7 100644
--- a/src/test/regress/expected/union_gp_optimizer.out
+++ b/src/test/regress/expected/union_gp_optimizer.out
@@ -1,7 +1,7 @@
 -- Additional GPDB-added tests for UNION
 SET optimizer_trace_fallback=on;
 create temp table t_union1 (a int, b int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 select distinct a, null::integer as c from t_union1 union select a, b from t_union1;
  a | c 
@@ -44,8 +44,8 @@ LINE 1: select 1 intersect (select 1, 2 union all select 3, 4);
 select 1 a, row_number() over (partition by 'a') union all (select 1 a , 2 b);
  a | row_number 
 ---+------------
- 1 |          2
  1 |          1
+ 1 |          2
 (2 rows)
 
 -- This should preserve domain types
@@ -104,8 +104,7 @@ DETAIL:  Falling back to Postgres-based planner because GPORCA does not support
 (1 row)
 
 CREATE TABLE union_ctas (a, b) AS SELECT 1, 2 UNION SELECT 1, 1 UNION SELECT 1, 1;
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Greenplum Database data distribution key for this table.
-HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause. Creating a NULL policy entry.
 SELECT * FROM union_ctas;
  a | b 
 ---+---
@@ -116,11 +115,9 @@ SELECT * FROM union_ctas;
 DROP TABLE union_ctas;
 -- MPP-21075: push quals below union
 CREATE TABLE union_quals1 (a, b) AS SELECT i, i%2 from generate_series(1,10) i;
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Greenplum Database data distribution key for this table.
-HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause. Creating a NULL policy entry.
 CREATE TABLE union_quals2 (a, b) AS SELECT i%2, i from generate_series(1,10) i;
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column(s) named 'a' as the Greenplum Database data distribution key for this table.
-HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause. Creating a NULL policy entry.
 SELECT * FROM (SELECT a, b from union_quals1 UNION SELECT b, a from union_quals2) as foo(a,b) where a > b order by a;
  a  | b 
 ----+---
@@ -225,7 +222,7 @@ select distinct a from (select  distinct 'A' from (select 'C' from (select disti
 -- on a single QE.
 --
 CREATE TABLE test1 (id int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into test1 values (1);
 CREATE EXTERNAL WEB TABLE test2 (id int) EXECUTE 'echo 2' ON COORDINATOR FORMAT 'csv';
@@ -234,8 +231,8 @@ union
 (SELECT 'test2' as branch, id FROM test2);
  branch | id 
 --------+----
- test1  |  1
  test2  |  2
+ test1  |  1
 (2 rows)
 
 explain (SELECT 'test1' as branch, id FROM test1 LIMIT 1)
@@ -243,10 +240,10 @@ union
 (SELECT 'test2' as branch, id FROM test2);
                                                           QUERY PLAN                                                          
 ------------------------------------------------------------------------------------------------------------------------------
- Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..984.78 rows=1125 width=12)
-   ->  HashAggregate  (cost=0.00..984.73 rows=375 width=12)
+ Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..985.86 rows=1125 width=12)
+   ->  HashAggregate  (cost=0.00..985.81 rows=375 width=12)
          Group Key: ('test1'::text), test1.id
-         ->  Append  (cost=0.00..984.65 rows=334 width=12)
+         ->  Append  (cost=0.00..985.73 rows=334 width=12)
                ->  Redistribute Motion 1:3  (slice2)  (cost=0.00..431.00 rows=1 width=12)
                      Hash Key: ('test1'::text), test1.id
                      ->  GroupAggregate  (cost=0.00..431.00 rows=1 width=12)
@@ -257,16 +254,16 @@ union
                                        ->  Result  (cost=0.00..431.00 rows=1 width=12)
                                              ->  Gather Motion 3:1  (slice3; segments: 3)  (cost=0.00..431.00 rows=1 width=4)
                                                    ->  Seq Scan on test1  (cost=0.00..431.00 rows=1 width=4)
-               ->  HashAggregate  (cost=0.00..553.64 rows=334 width=12)
-                     Group Key: ('test2'::text), test2.id
-                     ->  Redistribute Motion 3:3  (slice4; segments: 3)  (cost=0.00..553.56 rows=334 width=12)
-                           Hash Key: ('test2'::text), test2.id
-                           ->  Streaming HashAggregate  (cost=0.00..553.55 rows=334 width=12)
-                                 Group Key: 'test2'::text, test2.id
-                                 ->  Result  (cost=0.00..471.53 rows=333334 width=12)
-                                       ->  Redistribute Motion 1:3  (slice5)  (cost=0.00..467.53 rows=333334 width=4)
-                                             ->  Foreign Scan on test2  (cost=0.00..449.70 rows=1000000 width=4)
- Optimizer: Pivotal Optimizer (GPORCA)
+               ->  HashAggregate  (cost=0.00..554.73 rows=334 width=12)
+                     Group Key: ('test2'::text), id
+                     ->  Redistribute Motion 3:3  (slice4; segments: 3)  (cost=0.00..554.64 rows=334 width=12)
+                           Hash Key: ('test2'::text), id
+                           ->  Streaming HashAggregate  (cost=0.00..554.63 rows=334 width=12)
+                                 Group Key: 'test2'::text, id
+                                 ->  Result  (cost=0.00..473.73 rows=333334 width=12)
+                                       ->  Redistribute Motion 1:3  (slice5)  (cost=0.00..469.73 rows=333334 width=4)
+                                             ->  Foreign Scan on test2  (cost=0.00..451.90 rows=1000000 width=4)
+ Optimizer: GPORCA
 (24 rows)
 
 --
@@ -320,8 +317,8 @@ INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
 DETAIL:  Unknown error: Partially Distributed Data
                                       QUERY PLAN                                       
 ---------------------------------------------------------------------------------------
- Gather Motion 1:1  (slice1; segments: 1)  (cost=1922.00..1922.00 rows=172200 width=8)
-   ->  Append  (cost=0.00..1922.00 rows=172200 width=8)
+ Gather Motion 1:1  (slice1; segments: 1)  (cost=2783.00..2783.00 rows=172200 width=8)
+   ->  Append  (cost=0.00..2783.00 rows=172200 width=8)
          ->  Seq Scan on rep2  (cost=0.00..961.00 rows=86100 width=8)
          ->  Seq Scan on rep3  (cost=0.00..961.00 rows=86100 width=8)
  Optimizer: Postgres query optimizer
@@ -353,7 +350,7 @@ INSERT INTO T_a1 SELECT i, i%5 from generate_series(1,10) i;
 CREATE TABLE T_b2 (b1 int, b2 int) DISTRIBUTED BY(b2);
 INSERT INTO T_b2 SELECT i, i%5 from generate_series(1,20) i;
 CREATE TABLE T_random (c1 int, c2 int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c1' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c1' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 INSERT INTO T_random SELECT i, i%5 from generate_series(1,30) i;
 --start_ignore
@@ -2079,14 +2076,18 @@ insert into t1_ncols values (1, 11, 'one', '2001-01-01');
 insert into t2_ncols values (2, 22, 'two', '2002-02-02');
 insert into t2_ncols values (4, 44, 'four','2004-04-04');
 select b from t1_ncols union all select a from t2_ncols;
+NOTICE:  One or more columns in the following table(s) do not have statistics: t2_ncols
+HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For partitioned tables, run analyze rootpartition <table_name>(<column_list>). See log for columns missing statistics.
  b  
 ----
-  4
-  2
  11
+  2
+  4
 (3 rows)
 
 select a+100, b, d from t1_ncols union select b, a+200, d from t2_ncols order by 1;
+NOTICE:  One or more columns in the following table(s) do not have statistics: t2_ncols
+HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For partitioned tables, run analyze rootpartition <table_name>(<column_list>). See log for columns missing statistics.
  ?column? |  b  |     d      
 ----------+-----+------------
        22 | 202 | 02-02-2002
@@ -2095,15 +2096,19 @@ select a+100, b, d from t1_ncols union select b, a+200, d from t2_ncols order by
 (3 rows)
 
 select c, a from v1_ncols;
+NOTICE:  One or more columns in the following table(s) do not have statistics: t2_ncols
+HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For partitioned tables, run analyze rootpartition <table_name>(<column_list>). See log for columns missing statistics.
   c   | a 
 ------+---
  one  | 1
- four | 4
  two  | 2
+ four | 4
 (3 rows)
 
 with cte1(aa, b, c, d) as (select a*100, b, c, d from t1_ncols union select * from t2_ncols)
 select x.aa/100 aaa, x.c, y.c from cte1 x join cte1 y on x.aa=y.aa;
+NOTICE:  One or more columns in the following table(s) do not have statistics: t2_ncols
+HINT:  For non-partitioned tables, run analyze <table_name>(<column_list>). For partitioned tables, run analyze rootpartition <table_name>(<column_list>). See log for columns missing statistics.
  aaa |  c   |  c   
 -----+------+------
    0 | two  | two
@@ -2122,13 +2127,13 @@ NOTICE:  schema "union_schema" does not exist, skipping
 -- end_ignore
 create schema union_schema;
 create table union_schema.t1(a int, b int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table union_schema.t2(a int, b int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 create table union_schema.t3(a int, b int);
-NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Greenplum Database data distribution key for this table.
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 set allow_system_table_mods = on;
 update gp_distribution_policy set numsegments = 1
@@ -2188,8 +2193,8 @@ INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
 DETAIL:  Unknown error: Partially Distributed Data
                                              QUERY PLAN                                              
 -----------------------------------------------------------------------------------------------------
- Gather Motion 3:1  (slice1; segments: 3)  (cost=1.23..1472.30 rows=86130 width=8)
-   ->  Append  (cost=1.23..323.90 rows=28710 width=8)
+ Gather Motion 3:1  (slice1; segments: 3)  (cost=1.23..1615.85 rows=86130 width=8)
+   ->  Append  (cost=1.23..467.45 rows=28710 width=8)
          ->  Hash Join  (cost=1.23..2.80 rows=10 width=8)
                Hash Cond: (t2.b = t1.a)
                ->  Redistribute Motion 2:3  (slice2; segments: 2)  (cost=0.00..1.40 rows=20 width=4)
@@ -2208,6 +2213,8 @@ INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
 DETAIL:  Unknown error: Partially Distributed Data
  a  | b  | a  | b  
 ----+----+----+----
+  1 |  1 |  1 |  1
+  5 |  5 |  5 |  5
   2 |  2 |  2 |  2
   3 |  3 |  3 |  3
   4 |  4 |  4 |  4
@@ -2216,8 +2223,6 @@ DETAIL:  Unknown error: Partially Distributed Data
   8 |  8 |  8 |  8
   9 |  9 |  9 |  9
  10 | 10 | 10 | 10
-  1 |  1 |  1 |  1
-  5 |  5 |  5 |  5
 (10 rows)
 
 select union_schema.t1.a, union_schema.t2.b
@@ -2229,6 +2234,8 @@ INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
 DETAIL:  Unknown error: Partially Distributed Data
  a  | b  
 ----+----
+  1 |  1
+  5 |  5
   2 |  2
   3 |  3
   4 |  4
@@ -2237,8 +2244,6 @@ DETAIL:  Unknown error: Partially Distributed Data
   8 |  8
   9 |  9
  10 | 10
-  1 |  1
-  5 |  5
 (10 rows)
 
 truncate union_schema.t1, union_schema.t2;
@@ -2276,8 +2281,8 @@ INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
 DETAIL:  Unknown error: Partially Distributed Data
                                                 QUERY PLAN                                                 
 -----------------------------------------------------------------------------------------------------------
- Gather Motion 3:1  (slice1; segments: 3)  (cost=1.32..1472.20 rows=86130 width=8)
-   ->  Append  (cost=1.32..323.80 rows=28710 width=8)
+ Gather Motion 3:1  (slice1; segments: 3)  (cost=1.32..1615.75 rows=86130 width=8)
+   ->  Append  (cost=1.32..467.35 rows=28710 width=8)
          ->  Hash Join  (cost=1.32..2.70 rows=10 width=8)
                Hash Cond: (t1.a = t2.b)
                ->  Seq Scan on t1  (cost=0.00..1.20 rows=20 width=4)
@@ -2340,6 +2345,8 @@ reset allow_system_table_mods;
 create table rep (a int) distributed replicated;
 insert into rep select i from generate_series (1, 10) i; 
 create table dist (a int);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'a' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into dist select i from generate_series (1, 1000) i;
 analyze dist;
 analyze rep;
@@ -2352,7 +2359,7 @@ explain select a from rep union all select a from dist;
  Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..862.03 rows=1010 width=4)
    ->  Append  (cost=0.00..862.01 rows=337 width=4)
          ->  Result  (cost=0.00..431.00 rows=4 width=4)
-               One-Time Filter: (gp_execution_segment() = 2)
+               One-Time Filter: (gp_execution_segment() = 0)
                ->  Seq Scan on rep  (cost=0.00..431.00 rows=10 width=4)
          ->  Seq Scan on dist  (cost=0.00..431.01 rows=334 width=4)
  Optimizer: GPORCA
@@ -2368,12 +2375,12 @@ analyze rand;
 explain select i from generate_series(1,1000) i union all select a from rand;
                                        QUERY PLAN                                       
 ----------------------------------------------------------------------------------------
- Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..431.28 rows=11000 width=4)
+ Gather Motion 3:1  (slice1; segments: 3)  (cost=0.00..431.29 rows=11000 width=4)
    ->  Append  (cost=0.00..431.12 rows=3667 width=4)
          ->  Result  (cost=0.00..0.01 rows=334 width=4)
-               One-Time Filter: (gp_execution_segment() = 2)
+               One-Time Filter: (gp_execution_segment() = 0)
                ->  Function Scan on generate_series  (cost=0.00..0.00 rows=334 width=4)
-         ->  Seq Scan on rand  (cost=0.00..431.06 rows=3334 width=4)
+         ->  Seq Scan on rand  (cost=0.00..431.07 rows=3334 width=4)
  Optimizer: GPORCA
 (7 rows)
 
@@ -2460,7 +2467,7 @@ DETAIL:  Falling back to Postgres-based planner because GPORCA does not support
          ->  Gather Motion 3:1  (slice2; segments: 3)
                ->  Subquery Scan on "*SELECT* 2"
                      ->  Seq Scan on p1_1240
- Optimizer: Postgres-based planner
+ Optimizer: Postgres query optimizer
 (11 rows)
 
 with result as (update r_1240 set a = a +1 where a < 5 returning *) select * from result except select * from p1_1240;
@@ -2475,6 +2482,43 @@ DETAIL:  Falling back to Postgres-based planner because GPORCA does not support
 drop table r_1240;
 drop table p1_1240;
 --
+-- Test CTAS with UNION ALL when branches have different typmods (issue #1431).
+-- ORCA should resolve the output column type to character varying (no length),
+-- same as the Postgres planner, instead of picking the first branch's typmod.
+--
+create table union_ctas_t1(id int, name varchar(1));
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+create table union_ctas_t2(id int, name varchar(2));
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Apache Cloudberry data distribution key for this table.
+HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
+insert into union_ctas_t1 values (1, 'a');
+insert into union_ctas_t2 values (1, 'ab');
+create table union_ctas_result as
+  (select id, name from union_ctas_t1)
+  union all
+  (select id, name from union_ctas_t2);
+NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause. Creating a NULL policy entry.
+-- name column should be "character varying" without length, not varchar(1)
+select atttypmod from pg_attribute
+where attrelid = 'union_ctas_result'::regclass and attname = 'name';
+INFO:  GPORCA failed to produce a plan, falling back to Postgres-based planner
+DETAIL:  Falling back to Postgres-based planner because GPORCA does not support the following feature: Queries on master-only tables
+ atttypmod 
+-----------
+        -1
+(1 row)
+
+-- data should not be truncated
+select * from union_ctas_result order by name;
+ id | name 
+----+------
+  1 | a
+  1 | ab
+(2 rows)
+
+drop table union_ctas_t1, union_ctas_t2, union_ctas_result;
+--
 -- Clean up
 --
 DROP TABLE IF EXISTS T_a1 CASCADE;
diff --git a/src/test/regress/expected/vacuum_gp.out b/src/test/regress/expected/vacuum_gp.out
index daeb2504559..cac825d0cd4 100644
--- a/src/test/regress/expected/vacuum_gp.out
+++ b/src/test/regress/expected/vacuum_gp.out
@@ -446,6 +446,8 @@ create table relcache_leak_in_motion(v1 int);
 NOTICE:  Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'v1' as the Apache Cloudberry data distribution key for this table.
 HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew.
 insert into relcache_leak_in_motion values(generate_series(0, 10000));
+BEGIN;
+SET LOCAL synchronous_commit = local;
 SELECT gp_inject_fault('interconnect_stop_recv_chunk', 'interrupt', dbid)
   FROM gp_segment_configuration WHERE content = -1 and role='p';
  gp_inject_fault 
@@ -457,11 +459,8 @@ analyze relcache_leak_in_motion;
 ERROR:  canceling statement due to user request
 SELECT gp_inject_fault('interconnect_stop_recv_chunk', 'reset', dbid)
   FROM gp_segment_configuration WHERE content = -1 and role='p';
- gp_inject_fault 
------------------
- Success:
-(1 row)
-
+ERROR:  current transaction is aborted, commands ignored until end of transaction block
+COMMIT;
 -- start_ignore
 drop table if exists relcache_leak_in_motion;
 -- end_ignore
diff --git a/src/test/regress/expected/workfile/hashjoin_spill.out b/src/test/regress/expected/workfile/hashjoin_spill.out
index 5633e670954..053f457294b 100644
--- a/src/test/regress/expected/workfile/hashjoin_spill.out
+++ b/src/test/regress/expected/workfile/hashjoin_spill.out
@@ -37,6 +37,8 @@ HINT:  The 'DISTRIBUTED BY' clause determines the distribution of data. Make sur
 insert into test_hj_spill SELECT i,i,i%1000,i,i,i,i,i from
 	(select generate_series(1, nsegments * 15000) as i from
 	(select count(*) as nsegments from gp_segment_configuration where role='p' and content >= 0) foo) bar;
+-- Collect statistics to ensure ORCA generates correct execution plan
+ANALYZE test_hj_spill;
 SET statement_mem=1024;
 set gp_resqueue_print_operator_memory_limits=on;
 set gp_workfile_compression = on;
diff --git a/src/test/regress/greenplum_schedule b/src/test/regress/greenplum_schedule
index 3c8f7965b28..604616791c8 100755
--- a/src/test/regress/greenplum_schedule
+++ b/src/test/regress/greenplum_schedule
@@ -167,6 +167,7 @@ test: instr_in_shmem_verify
 # hold locks.
 test: partition_locking
 test: vacuum_gp
+test: vacuum_fsm_nondefault_tablespace
 test: resource_queue_stat
 # background analyze may affect pgstat
 test: pg_stat
diff --git a/src/test/regress/input/pgstat_qd_tabstat.source b/src/test/regress/input/pgstat_qd_tabstat.source
index 0fb8c0ccb71..e9f76ccf0d6 100644
--- a/src/test/regress/input/pgstat_qd_tabstat.source
+++ b/src/test/regress/input/pgstat_qd_tabstat.source
@@ -10,7 +10,7 @@ copy table_for_docopy (i, j) from stdin;
 3	hello3
 \.
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_docopy'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_docopy'::regclass;
 
 CREATE TABLE data_tbl (a int,b char) distributed by (a);
 INSERT INTO data_tbl values(1,'1');
@@ -21,7 +21,7 @@ COPY data_tbl TO '/tmp/data_tbl<SEGID>.csv' on segment;
 create table copy_on_segment (a int,b char);
 COPY copy_on_segment from '/tmp/data_tbl<SEGID>.csv' on segment log errors segment reject limit 3 rows;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'copy_on_segment'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'copy_on_segment'::regclass;
 
 
 -- Test pgstat table stat in initplan on QD
@@ -34,26 +34,26 @@ copy table_for_initplan (i, j, k) from stdin;
 explain (costs off) with updated AS (update table_for_initplan set k = 33 where i = 3 returning k) select table_for_initplan.*, (select sum(k) from updated) from table_for_initplan;
 with updated AS (update table_for_initplan set k = 33 where i = 3 returning k) select table_for_initplan.*, (select sum(k) from updated) from table_for_initplan;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_initplan'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_initplan'::regclass;
 
 
 -- Test pgstat table stat in CTAS on QD
 create table table_for_ctas with (autovacuum_enabled=false) as select i, 'hello' || i from generate_series(1, 100) f(i);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_ctas'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_ctas'::regclass;
 select i, 'hello' || i into table_for_insert_into from generate_series(1, 100) f(i);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_insert_into'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_insert_into'::regclass;
 
 
 -- Test pgstat table stat in ALTER TABLE SET DISTRIBUTED BY on QD
 create table table_for_set_distributed_by(i int, j varchar) distributed by (i);
 insert into table_for_set_distributed_by select i, 'hello' || i from generate_series(1, 333) f(i);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_set_distributed_by'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_set_distributed_by'::regclass;
 alter table table_for_set_distributed_by set distributed by (j);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_set_distributed_by'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_set_distributed_by'::regclass;
 
 
 -- Test pgstat table stat in execution of funciton on QD
@@ -68,7 +68,7 @@ $$
 language plpgsql volatile;
 select update_table_for_function();
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_function'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_function'::regclass;
 
 
 -- Test pgstat table stat in ALTER TABLE EXPAND TABLE on QD;
@@ -78,11 +78,11 @@ create table table_for_expand(i int, j varchar) distributed by (i);
 insert into table_for_expand select i, 'hello' || i from generate_series(1, 333) f(i);
 select count(distinct gp_segment_id) from table_for_expand;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_expand'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_expand'::regclass;
 alter table table_for_expand expand table;
 select count(distinct gp_segment_id) from table_for_expand;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_expand'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_expand'::regclass;
 select gp_debug_reset_create_table_default_numsegments();
 
 
@@ -103,7 +103,7 @@ update table_for_iud set j = 'heroes never die' where i >= 300;
 release savepoint level3;
 commit;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_iud'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_iud'::regclass;
 
 begin;
 savepoint level1;
@@ -120,14 +120,14 @@ rollback to savepoint level3;
 delete from table_for_iud where i <= 200;
 commit;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_iud'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_iud'::regclass;
 
 
 -- Test pgstat table stat in TRUNCATE on QD
 create table table_for_truncate(i int, j varchar) distributed by (i);
 insert into table_for_truncate select i, 'hello' || i from generate_series(1, 777) f(i);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_truncate'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_truncate'::regclass;
 begin;
 savepoint level1;
 savepoint level2;
@@ -141,12 +141,12 @@ delete from table_for_truncate where i >= 700;
 update table_for_truncate set j = 'D' where i <= 200;
 commit;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate'::regclass;
 
 create table table_for_truncate_abort(i int, j varchar) distributed by (i);
 insert into table_for_truncate_abort select i, 'hello' || i from generate_series(1, 777) f(i);
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate_abort'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate_abort'::regclass;
 begin;
 savepoint level1;
 savepoint level2;
@@ -160,7 +160,7 @@ delete from table_for_truncate_abort where i < 700;
 update table_for_truncate_abort set j = 'D' where i >= 200;
 rollback;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate_abort'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate_abort'::regclass;
 
 
 -- Test pgstat table stat for partition table on QD
@@ -171,17 +171,17 @@ PARTITION BY RANGE (rank)
   DEFAULT PARTITION extra );
 insert into rankpart select i, i % 10, i from generate_series(1, 1000)i;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
 
 begin;
 delete from rankpart where id <= 100;
 rollback;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
 
 copy rankpart (id, rank, product) from stdin;
 1001	1	1001
@@ -196,8 +196,8 @@ copy rankpart (id, rank, product) from stdin;
 1010	6	1010
 \.
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
 
 begin;
 update rankpart set rank = 1 where id > 1005;
@@ -209,9 +209,9 @@ release savepoint level2;
 rollback to savepoint level1;
 commit;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
 
 begin;
 savepoint level1_1;
@@ -219,9 +219,9 @@ insert into rankpart select i, i % 10, i from generate_series(2001, 3000)i;
 insert into rankpart select i, i % 10, i from generate_series(3001, 4000)i;
 commit;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
 
 
 -- Test pgstat matview stat with distributed policy.
@@ -229,11 +229,11 @@ create table base_table(i int, j int, z int ) distributed by (i);
 insert into base_table select i,i,i from generate_series(1, 100) i;
 create materialized view mt as select * from base_table where z>=50;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 insert into base_table select i,i,i from generate_series(1, 100) i;
 refresh materialized view mt;
 select pg_sleep(0.77) from gp_dist_random('gp_id'); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 -- pg_stat_all_tables collects gpstats across segments
 select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 
@@ -245,11 +245,11 @@ create table base_table(i int, j int, z int ) distributed replicated;
 insert into base_table select i,i,i from generate_series(1, 100) i;
 create materialized view mt as select * from base_table where z>=50 distributed replicated;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 insert into base_table select i,i,i from generate_series(1, 100) i;
 refresh materialized view mt;
 select pg_sleep(0.77) from gp_dist_random('gp_id'); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 -- pg_stat_all_tables collects gpstats across segments
 select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
 
@@ -263,15 +263,15 @@ insert into tabstat_ao select 1,1;
 delete from tabstat_ao;
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
 
-select count(*) from pg_stat_all_tables
+select count(*) from gp_stat_all_tables_summary
 where
     relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass)
     OR relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass)
     OR relid = (select visimaprelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
 
 select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
-select n_tup_ins from pg_stat_all_tables where relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
-select n_tup_ins from pg_stat_all_tables where relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
-select n_tup_ins from pg_stat_all_tables where relid = (select visimaprelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select visimaprelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
 
 drop table tabstat_ao;
diff --git a/src/test/regress/input/vacuum_fsm_nondefault_tablespace.source b/src/test/regress/input/vacuum_fsm_nondefault_tablespace.source
new file mode 100644
index 00000000000..adce9ab77de
--- /dev/null
+++ b/src/test/regress/input/vacuum_fsm_nondefault_tablespace.source
@@ -0,0 +1,54 @@
+-- Test: VACUUM on a table in a non-default tablespace does not crash on first run.
+--
+-- Bug: SIGSEGV in fsm_extend() (freespace.c:637) when vacuuming a heap table
+-- (or an AO table's aoseg auxiliary table) that resides in a non-default
+-- tablespace for the very first time.
+--
+-- Root cause: commit "Prevent CREATE TABLE from using dangling tablespace"
+-- added TablespaceLockTuple() in TablespaceCreateDbspace() for non-default
+-- tablespaces. That call reaches AcceptInvalidationMessages() via
+-- LockSharedObject(), which processes a pending SHAREDINVALSMGR_ID message
+-- that vm_extend() had queued via CacheInvalidateSmgr(), nullifying
+-- rel->rd_smgr before fsm_extend() dereferences it at freespace.c:637.
+--
+-- Fix: added RelationOpenSmgr(rel) after smgrcreate() in both fsm_extend()
+-- (freespace.c) and vm_extend() (visibilitymap.c) so that rd_smgr is
+-- re-opened if the sinval handler closed it.
+
+CREATE TABLESPACE fsm_ts_test LOCATION '@testtablespace@';
+
+-- Case 1: plain heap table in non-default tablespace, first VACUUM.
+-- Before the fix this crashed with SIGSEGV at freespace.c:637:
+--   vm_extend()  -> CacheInvalidateSmgr  (queues SHAREDINVALSMGR_ID)
+--   fsm_extend() -> smgrcreate -> TablespaceCreateDbspace
+--                -> TablespaceLockTuple  -> AcceptInvalidationMessages
+--                -> processes SHAREDINVALSMGR_ID -> rel->rd_smgr = NULL
+--                -> rel->rd_smgr->smgr_cached_nblocks[...] = ...  SIGSEGV
+CREATE TABLE fsm_ts_heap (id int, val text)
+    TABLESPACE fsm_ts_test
+    DISTRIBUTED BY (id);
+INSERT INTO fsm_ts_heap SELECT i, repeat('x', 80) FROM generate_series(1, 500) i;
+VACUUM ANALYZE fsm_ts_heap;
+SELECT count(*) FROM fsm_ts_heap;
+-- Second VACUUM must also succeed (FSM/VM now exist, different code path).
+VACUUM ANALYZE fsm_ts_heap;
+SELECT count(*) FROM fsm_ts_heap;
+DROP TABLE fsm_ts_heap;
+
+-- Case 2: AO table in non-default tablespace.
+-- The crash occurs inside the recursive vacuum of the aoseg auxiliary table
+-- (which is also a heap table stored in the same non-default tablespace).
+CREATE TABLE fsm_ts_ao (id int, val text)
+    USING ao_row
+    TABLESPACE fsm_ts_test
+    DISTRIBUTED BY (id);
+INSERT INTO fsm_ts_ao SELECT i, repeat('y', 80) FROM generate_series(1, 500) i;
+VACUUM ANALYZE fsm_ts_ao;
+SELECT count(*) FROM fsm_ts_ao;
+-- Second VACUUM must also succeed.
+VACUUM ANALYZE fsm_ts_ao;
+SELECT count(*) FROM fsm_ts_ao;
+DROP TABLE fsm_ts_ao;
+
+-- Cleanup.
+DROP TABLESPACE fsm_ts_test;
diff --git a/src/test/regress/output/pgstat_qd_tabstat.source b/src/test/regress/output/pgstat_qd_tabstat.source
index ca612e18b9c..591f262f7c5 100644
--- a/src/test/regress/output/pgstat_qd_tabstat.source
+++ b/src/test/regress/output/pgstat_qd_tabstat.source
@@ -10,7 +10,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_docopy'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_docopy'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
          3 |         0 |         0 |             0 |          3 |          0 |                   3
@@ -32,7 +32,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'copy_on_segment'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'copy_on_segment'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
          4 |         0 |         0 |             0 |          4 |          0 |                   4
@@ -70,7 +70,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_initplan'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_initplan'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
          3 |         1 |         0 |             0 |          3 |          1 |                   4
@@ -86,7 +86,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_ctas'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_ctas'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        100 |         0 |         0 |             0 |        100 |          0 |                 100
@@ -101,7 +101,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_insert_into'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_insert_into'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        100 |         0 |         0 |             0 |        100 |          0 |                 100
@@ -116,7 +116,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_set_distributed_by'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_set_distributed_by'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        333 |         0 |         0 |             0 |        333 |          0 |                 333
@@ -129,7 +129,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_set_distributed_by'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_set_distributed_by'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        333 |         0 |         0 |             0 |        333 |          0 |                 333
@@ -157,7 +157,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_function'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_function'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        333 |         0 |       200 |             0 |        133 |        200 |                 533
@@ -185,7 +185,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_expand'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_expand'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        333 |         0 |         0 |             0 |        333 |          0 |                 333
@@ -204,7 +204,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_expand'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_expand'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        333 |         0 |         0 |             0 |        333 |          0 |                 333
@@ -238,7 +238,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_iud'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_iud'::regclass;
  n_live_tup | n_dead_tup 
 ------------+------------
         333 |         34
@@ -264,7 +264,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_iud'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_iud'::regclass;
  n_live_tup | n_dead_tup 
 ------------+------------
         133 |        713
@@ -279,7 +279,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'table_for_truncate'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'table_for_truncate'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        777 |         0 |         0 |             0 |        777 |          0 |                 777
@@ -303,7 +303,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate'::regclass;
  n_live_tup | n_dead_tup 
 ------------+------------
         699 |        301
@@ -317,7 +317,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate_abort'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate_abort'::regclass;
  n_live_tup | n_dead_tup 
 ------------+------------
         777 |          0
@@ -341,7 +341,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_live_tup, n_dead_tup from pg_stat_all_tables_internal where relid = 'table_for_truncate_abort'::regclass;
+select n_live_tup, n_dead_tup from pg_stat_all_tables where relid = 'table_for_truncate_abort'::regclass;
  n_live_tup | n_dead_tup 
 ------------+------------
         777 |        223
@@ -360,19 +360,19 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        500 |         0 |         0 |             0 |        500 |          0 |                 500
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        400 |         0 |         0 |             0 |        400 |          0 |                 400
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        100 |         0 |         0 |             0 |        100 |          0 |                 100
@@ -387,19 +387,19 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        500 |         0 |        50 |             0 |        500 |          0 |                 500
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        400 |         0 |        40 |             0 |        400 |          0 |                 400
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        100 |         0 |        10 |             0 |        100 |          0 |                 100
@@ -412,13 +412,13 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        505 |         0 |        50 |             0 |        505 |          0 |                 505
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        405 |         0 |        40 |             0 |        405 |          0 |                 405
@@ -439,19 +439,19 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        510 |         0 |        55 |             0 |        510 |          0 |                 510
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        410 |         0 |        50 |             0 |        400 |         10 |                 410
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        100 |         0 |        10 |             0 |        100 |          0 |                 100
@@ -468,19 +468,19 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_2'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_2'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
       1510 |         0 |        55 |             0 |       1510 |          0 |                1510
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_3'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_3'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
       1210 |         0 |        50 |             0 |       1200 |         10 |                1210
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'rankpart_1_prt_extra'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'rankpart_1_prt_extra'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        300 |         0 |        10 |             0 |        300 |          0 |                 300
@@ -498,7 +498,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
         51 |         0 |         0 |             0 |         51 |          0 |                  51
@@ -514,7 +514,7 @@ select pg_sleep(0.77) from gp_dist_random('gp_id'); -- Force pgstat_report_stat(
  
 (3 rows)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        153 |         0 |         0 |             0 |        102 |          0 |                 153
@@ -539,7 +539,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
         51 |         0 |         0 |             0 |         51 |          0 |                  51
@@ -555,7 +555,7 @@ select pg_sleep(0.77) from gp_dist_random('gp_id'); -- Force pgstat_report_stat(
  
 (3 rows)
 
-select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables_internal where relid = 'mt'::regclass;
+select n_tup_ins, n_tup_upd, n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze from pg_stat_all_tables where relid = 'mt'::regclass;
  n_tup_ins | n_tup_upd | n_tup_del | n_tup_hot_upd | n_live_tup | n_dead_tup | n_mod_since_analyze 
 -----------+-----------+-----------+---------------+------------+------------+---------------------
        153 |         0 |         0 |             0 |        102 |          0 |                 153
@@ -580,7 +580,7 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select count(*) from pg_stat_all_tables
+select count(*) from gp_stat_all_tables_summary
 where
     relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass)
     OR relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass)
@@ -596,19 +596,19 @@ select pg_sleep(0.77); -- Force pgstat_report_stat() to send tabstat.
  
 (1 row)
 
-select n_tup_ins from pg_stat_all_tables where relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select segrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
  n_tup_ins 
 -----------
          1
 (1 row)
 
-select n_tup_ins from pg_stat_all_tables where relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select blkdirrelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
  n_tup_ins 
 -----------
          1
 (1 row)
 
-select n_tup_ins from pg_stat_all_tables where relid = (select visimaprelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
+select n_tup_ins from gp_stat_all_tables_summary where relid = (select visimaprelid from pg_appendonly where relid = 'tabstat_ao'::regclass);
  n_tup_ins 
 -----------
          1
diff --git a/src/test/regress/output/vacuum_fsm_nondefault_tablespace.source b/src/test/regress/output/vacuum_fsm_nondefault_tablespace.source
new file mode 100644
index 00000000000..fc2ff245691
--- /dev/null
+++ b/src/test/regress/output/vacuum_fsm_nondefault_tablespace.source
@@ -0,0 +1,70 @@
+-- Test: VACUUM on a table in a non-default tablespace does not crash on first run.
+--
+-- Bug: SIGSEGV in fsm_extend() (freespace.c:637) when vacuuming a heap table
+-- (or an AO table's aoseg auxiliary table) that resides in a non-default
+-- tablespace for the very first time.
+--
+-- Root cause: commit "Prevent CREATE TABLE from using dangling tablespace"
+-- added TablespaceLockTuple() in TablespaceCreateDbspace() for non-default
+-- tablespaces. That call reaches AcceptInvalidationMessages() via
+-- LockSharedObject(), which processes a pending SHAREDINVALSMGR_ID message
+-- that vm_extend() had queued via CacheInvalidateSmgr(), nullifying
+-- rel->rd_smgr before fsm_extend() dereferences it at freespace.c:637.
+--
+-- Fix: added RelationOpenSmgr(rel) after smgrcreate() in both fsm_extend()
+-- (freespace.c) and vm_extend() (visibilitymap.c) so that rd_smgr is
+-- re-opened if the sinval handler closed it.
+CREATE TABLESPACE fsm_ts_test LOCATION '@testtablespace@';
+-- Case 1: plain heap table in non-default tablespace, first VACUUM.
+-- Before the fix this crashed with SIGSEGV at freespace.c:637:
+--   vm_extend()  -> CacheInvalidateSmgr  (queues SHAREDINVALSMGR_ID)
+--   fsm_extend() -> smgrcreate -> TablespaceCreateDbspace
+--                -> TablespaceLockTuple  -> AcceptInvalidationMessages
+--                -> processes SHAREDINVALSMGR_ID -> rel->rd_smgr = NULL
+--                -> rel->rd_smgr->smgr_cached_nblocks[...] = ...  SIGSEGV
+CREATE TABLE fsm_ts_heap (id int, val text)
+    TABLESPACE fsm_ts_test
+    DISTRIBUTED BY (id);
+INSERT INTO fsm_ts_heap SELECT i, repeat('x', 80) FROM generate_series(1, 500) i;
+VACUUM ANALYZE fsm_ts_heap;
+SELECT count(*) FROM fsm_ts_heap;
+ count 
+-------
+   500
+(1 row)
+
+-- Second VACUUM must also succeed (FSM/VM now exist, different code path).
+VACUUM ANALYZE fsm_ts_heap;
+SELECT count(*) FROM fsm_ts_heap;
+ count 
+-------
+   500
+(1 row)
+
+DROP TABLE fsm_ts_heap;
+-- Case 2: AO table in non-default tablespace.
+-- The crash occurs inside the recursive vacuum of the aoseg auxiliary table
+-- (which is also a heap table stored in the same non-default tablespace).
+CREATE TABLE fsm_ts_ao (id int, val text)
+    USING ao_row
+    TABLESPACE fsm_ts_test
+    DISTRIBUTED BY (id);
+INSERT INTO fsm_ts_ao SELECT i, repeat('y', 80) FROM generate_series(1, 500) i;
+VACUUM ANALYZE fsm_ts_ao;
+SELECT count(*) FROM fsm_ts_ao;
+ count 
+-------
+   500
+(1 row)
+
+-- Second VACUUM must also succeed.
+VACUUM ANALYZE fsm_ts_ao;
+SELECT count(*) FROM fsm_ts_ao;
+ count 
+-------
+   500
+(1 row)
+
+DROP TABLE fsm_ts_ao;
+-- Cleanup.
+DROP TABLESPACE fsm_ts_test;
diff --git a/src/test/regress/parallel_schedule b/src/test/regress/parallel_schedule
index 5adb7d9df01..79eb980de74 100644
--- a/src/test/regress/parallel_schedule
+++ b/src/test/regress/parallel_schedule
@@ -194,5 +194,8 @@ test: constraints_check
 # run stats by itself because its delay may be insufficient under heavy load
 test: stats
 
+# ORCA parallel tests
+test: orca_parallel
+
 # test of tag
 test: tag
diff --git a/src/test/regress/sql/.gitignore b/src/test/regress/sql/.gitignore
index 9b5f3660fa7..3a340338616 100644
--- a/src/test/regress/sql/.gitignore
+++ b/src/test/regress/sql/.gitignore
@@ -64,3 +64,4 @@
 /ao_unique_index_partition.sql
 /bfv_copy.sql
 /copy_encoding_error.sql
+/vacuum_fsm_nondefault_tablespace.sql
diff --git a/src/test/regress/sql/analyze.sql b/src/test/regress/sql/analyze.sql
index fa2ce8b834f..6d1c7ddd159 100644
--- a/src/test/regress/sql/analyze.sql
+++ b/src/test/regress/sql/analyze.sql
@@ -677,3 +677,26 @@ analyze verbose p2;
 select * from pg_stats where tablename like 'part2';
 
 drop table multipart cascade;
+
+--
+-- Test column-specific ANALYZE correctly uses attnum-based NDV index (not loop index).
+-- When ANALYZE t(b) is run, the QD loop has i=0 for column b (attnum=2),
+-- so attnum-1=1 != i=0. Without the fix, colNDVBySeg[i=0] reads column a's NDV
+-- instead of column b's NDV.
+--
+CREATE TABLE analyze_col_ndv_drop (a int, b int, c int) DISTRIBUTED BY (a);
+INSERT INTO analyze_col_ndv_drop SELECT i%5, i, i%50 FROM generate_series(1, 100) i;
+-- ANALYZE specific column b: QD loop has i=0, b.attnum=2, so attnum-1=1 != i=0
+ANALYZE analyze_col_ndv_drop (b);
+-- stadistinctbyseg for b should be 100 (all distinct), not ~5 (NDV of column a at index 0)
+SELECT a.attname,
+       CASE WHEN s.stakind1 = 8 THEN array_to_string(s.stavalues1, ',')
+            WHEN s.stakind2 = 8 THEN array_to_string(s.stavalues2, ',')
+            WHEN s.stakind3 = 8 THEN array_to_string(s.stavalues3, ',')
+            WHEN s.stakind4 = 8 THEN array_to_string(s.stavalues4, ',')
+            WHEN s.stakind5 = 8 THEN array_to_string(s.stavalues5, ',')
+       END AS stadistinctbyseg
+FROM pg_statistic s
+JOIN pg_attribute a ON a.attrelid = s.starelid AND a.attnum = s.staattnum
+WHERE s.starelid = 'analyze_col_ndv_drop'::regclass AND a.attname = 'b';
+DROP TABLE analyze_col_ndv_drop;
diff --git a/src/test/regress/sql/brin.sql b/src/test/regress/sql/brin.sql
index 9a446efdc82..fade709eaa4 100644
--- a/src/test/regress/sql/brin.sql
+++ b/src/test/regress/sql/brin.sql
@@ -330,6 +330,7 @@ BEGIN
 		SET enable_bitmapscan = 1;
 		SET optimizer_enable_tablescan = 0;
 		SET optimizer_enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		is_planner_plan := false;
diff --git a/src/test/regress/sql/brin_bloom.sql b/src/test/regress/sql/brin_bloom.sql
index 84572fdc2fb..558ca5730b7 100644
--- a/src/test/regress/sql/brin_bloom.sql
+++ b/src/test/regress/sql/brin_bloom.sql
@@ -231,6 +231,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_bloom WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/sql/brin_multi.sql b/src/test/regress/sql/brin_multi.sql
index a46c09951b5..327a4215bf9 100644
--- a/src/test/regress/sql/brin_multi.sql
+++ b/src/test/regress/sql/brin_multi.sql
@@ -266,6 +266,7 @@ BEGIN
 		-- run the query using the brin index
 		SET enable_seqscan = 0;
 		SET enable_bitmapscan = 1;
+		SET enable_parallel = 0;
 
 		plan_ok := false;
 		FOR plan_line IN EXECUTE format($y$EXPLAIN SELECT array_agg(ctid) FROM brintest_multi WHERE %s $y$, cond) LOOP
diff --git a/src/test/regress/sql/cbdb_parallel.sql b/src/test/regress/sql/cbdb_parallel.sql
index f9d01dd8a00..08e7aa198f9 100644
--- a/src/test/regress/sql/cbdb_parallel.sql
+++ b/src/test/regress/sql/cbdb_parallel.sql
@@ -1149,6 +1149,56 @@ reset gp_cte_sharing;
 reset enable_parallel;
 reset min_parallel_table_scan_size;
 
+--
+-- Parallel Hash Full/Right Join
+--
+begin;
+create table pj_t1(id int, v int) with(parallel_workers=2) distributed by (id);
+create table pj_t2(id int, v int) with(parallel_workers=2) distributed by (id);
+create table pj_t3(id int, v int) with(parallel_workers=0) distributed by (id);
+
+-- pj_t1 is 3x larger than pj_t2 so the planner hashes the smaller pj_t2
+-- and probes with pj_t1, producing a genuine Parallel Hash Right Join plan.
+insert into pj_t1 select i, i from generate_series(1,30000)i;
+insert into pj_t2 select i, i from generate_series(25001,35000)i;
+insert into pj_t3 select i, i from generate_series(1,10000)i;
+analyze pj_t1;
+analyze pj_t2;
+analyze pj_t3;
+
+set local enable_parallel = on;
+set local min_parallel_table_scan_size = 0;
+
+-- 12_P_12_10: Parallel Hash Full Join: HashedWorkers FULL JOIN HashedWorkers -> HashedOJ(parallel)
+explain(costs off, locus)
+select count(*) from pj_t1 full join pj_t2 using (id);
+-- correctness: parallel result matches non-parallel
+set local enable_parallel = off;
+select count(*) from pj_t1 full join pj_t2 using (id);
+set local enable_parallel = on;
+select count(*) from pj_t1 full join pj_t2 using (id);
+
+-- Parallel Hash Right Join: pj_t1 (30K) is larger, so the planner hashes the smaller pj_t2
+-- (10K) as the build side and probes with pj_t1; result locus HashedWorkers(parallel)
+explain(costs off, locus)
+select count(*) from pj_t1 right join pj_t2 using (id);
+-- correctness: parallel result matches non-parallel
+set local enable_parallel = off;
+select count(*) from pj_t1 right join pj_t2 using (id);
+set local enable_parallel = on;
+select count(*) from pj_t1 right join pj_t2 using (id);
+
+-- Locus propagation: HashedOJ(parallel) followed by INNER JOIN with Hashed(serial)
+-- The full join result (HashedOJ,parallel=2) is joined with pj_t3 (Hashed,serial)
+explain(costs off, locus)
+select count(*) from (pj_t1 full join pj_t2 using (id)) fj inner join pj_t3 using (id);
+
+-- Locus propagation: HashedOJ(parallel) followed by FULL JOIN with Hashed(serial)
+explain(costs off, locus)
+select count(*) from (pj_t1 full join pj_t2 using (id)) fj full join pj_t3 using (id);
+
+abort;
+
 -- start_ignore
 drop schema test_parallel cascade;
 -- end_ignore
diff --git a/src/test/regress/sql/create_index.sql b/src/test/regress/sql/create_index.sql
index ac5526ea9b1..b01c11aaf4f 100644
--- a/src/test/regress/sql/create_index.sql
+++ b/src/test/regress/sql/create_index.sql
@@ -649,7 +649,7 @@ DROP TABLE syscol_table;
 -- Tests for IS NULL/IS NOT NULL with b-tree indexes
 --
 
-CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek;
+CREATE TABLE onek_with_null AS SELECT unique1, unique2 FROM onek DISTRIBUTED BY (unique1);
 INSERT INTO onek_with_null (unique1,unique2) VALUES (NULL, -1), (NULL, NULL);
 CREATE UNIQUE INDEX onek_nulltest ON onek_with_null (unique2,unique1);
 
diff --git a/src/test/regress/sql/create_view.sql b/src/test/regress/sql/create_view.sql
index f35364b8a23..4605fdb71b1 100644
--- a/src/test/regress/sql/create_view.sql
+++ b/src/test/regress/sql/create_view.sql
@@ -693,6 +693,38 @@ select x + y + z as c1,
 from (values(1,2,3)) v(x,y,z);
 select pg_get_viewdef('tt26v', true);
 
+
+-- Test that changing the relkind of a relcache entry doesn't cause
+-- trouble. Prior instances of where it did:
+-- CALDaNm2yXz+zOtv7y5zBd5WKT8O0Ld3YxikuU3dcyCvxF7gypA@mail.gmail.com
+-- CALDaNm3oZA-8Wbps2Jd1g5_Gjrr-x3YWrJPek-mF5Asrrvz2Dg@mail.gmail.com
+CREATE TABLE tt26(c int);
+
+BEGIN;
+CREATE TABLE tt27(c int);
+SAVEPOINT q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+SELECT * FROM tt27;
+ROLLBACK TO q;
+CREATE RULE "_RETURN" AS ON SELECT TO tt27 DO INSTEAD SELECT * FROM tt26;
+ROLLBACK;
+
+BEGIN;
+CREATE TABLE tt28(c int);
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+CREATE RULE "_RETURN" AS ON SELECT TO tt28 DO INSTEAD SELECT * FROM tt26;
+ROLLBACK;
+
+
+-- test restriction on non-system view expansion.
+create table tt27v_tbl (a int);
+create view tt27v as select a from tt27v_tbl;
+set restrict_nonsystem_relation_kind to 'view';
+select a from tt27v where a > 0; -- Error
+insert into tt27v values (1); -- Error
+select viewname from pg_views where viewname = 'tt27v'; -- Ok to access a system view.
+reset restrict_nonsystem_relation_kind;
+
 -- test display negative operator of const-folder expression
 create table tdis(a int, b int, c int);
 create view tdis_v1 as select a,b,c, -1::int from tdis group by 1,2,3,4;
diff --git a/src/test/regress/sql/groupingsets.sql b/src/test/regress/sql/groupingsets.sql
index 6907b5f1f55..851a1eea6bb 100644
--- a/src/test/regress/sql/groupingsets.sql
+++ b/src/test/regress/sql/groupingsets.sql
@@ -353,6 +353,12 @@ explain (costs off)
   select v.c, (select count(*) from gstest2 group by () having v.c)
     from (values (false),(true)) v(c) order by v.c;
 
+-- HAVING with constant-false predicate on an empty grouping set must emit
+-- zero rows, not the default scalar-aggregate row.
+select count(*) from gstest2 group by grouping sets (()) having false;
+explain (costs off)
+  select count(*) from gstest2 group by grouping sets (()) having false;
+
 -- HAVING with GROUPING queries
 select ten, grouping(ten) from onek
 group by grouping sets(ten) having grouping(ten) >= 0
diff --git a/src/test/regress/sql/join_hash.sql b/src/test/regress/sql/join_hash.sql
index 325068e9d23..2978e155ecd 100644
--- a/src/test/regress/sql/join_hash.sql
+++ b/src/test/regress/sql/join_hash.sql
@@ -13,6 +13,9 @@ set allow_system_table_mods=on;
 set local min_parallel_table_scan_size = 0;
 set local parallel_setup_cost = 0;
 set local enable_hashjoin = on;
+-- CBDB: disable CBDB parallel for these PG-originated tests; parallel full join
+-- is tested separately in cbdb_parallel.sql.
+set local enable_parallel = off;
 
 -- Extract bucket and batch counts from an explain analyze plan.  In
 -- general we can't make assertions about how many batches (or
@@ -191,6 +194,8 @@ select original > 1 as initially_multibatch, final > original as increased_batch
 $$
   select count(*) from simple r join simple s using (id);
 $$);
+-- parallel full multi-batch hash join
+select count(*) from simple r full outer join simple s using (id);
 rollback to settings;
 
 -- The "bad" case: during execution we need to increase number of
@@ -438,7 +443,16 @@ explain (costs off)
 select  count(*) from simple r full outer join simple s using (id);
 rollback to settings;
 
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
+savepoint settings;
+set enable_parallel_hash = off;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s using (id);
+select  count(*) from simple r full outer join simple s using (id);
+rollback to settings;
+
+-- parallelism is possible with parallel-aware full hash join
 savepoint settings;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
@@ -446,7 +460,7 @@ explain (costs off)
 select  count(*) from simple r full outer join simple s using (id);
 rollback to settings;
 
--- An full outer join where every record is not matched.
+-- A full outer join where every record is not matched.
 
 -- non-parallel
 savepoint settings;
@@ -456,7 +470,16 @@ explain (costs off)
 select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
 rollback to settings;
 
--- parallelism not possible with parallel-oblivious outer hash join
+-- parallelism not possible with parallel-oblivious full hash join
+savepoint settings;
+set enable_parallel_hash = off;
+set local max_parallel_workers_per_gather = 2;
+explain (costs off)
+     select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
+rollback to settings;
+
+-- parallelism is possible with parallel-aware full hash join
 savepoint settings;
 set local max_parallel_workers_per_gather = 2;
 explain (costs off)
@@ -464,6 +487,7 @@ explain (costs off)
 select  count(*) from simple r full outer join simple s on (r.id = 0 - s.id);
 rollback to settings;
 
+
 -- exercise special code paths for huge tuples (note use of non-strict
 -- expression and left join required to get the detoasted tuple into
 -- the hash table)
@@ -518,6 +542,37 @@ rollback to settings;
 
 rollback;
 
+-- Hash join reuses the HOT status bit to indicate match status. This can only
+-- be guaranteed to produce correct results if all the hash join tuple match
+-- bits are reset before reuse. This is done upon loading them into the
+-- hashtable.
+begin;
+SAVEPOINT settings;
+-- CBDB: disable CBDB parallel; the serial full join match-bit test is what matters here.
+SET enable_parallel = off;
+SET enable_parallel_hash = on;
+SET min_parallel_table_scan_size = 0;
+SET parallel_setup_cost = 0;
+SET parallel_tuple_cost = 0;
+CREATE TABLE hjtest_matchbits_t1(id int);
+CREATE TABLE hjtest_matchbits_t2(id int);
+INSERT INTO hjtest_matchbits_t1 VALUES (1);
+INSERT INTO hjtest_matchbits_t2 VALUES (2);
+-- Update should create a HOT tuple. If this status bit isn't cleared, we won't
+-- correctly emit the NULL-extended unmatching tuple in full hash join.
+UPDATE hjtest_matchbits_t2 set id = 2;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id
+  ORDER BY t1.id;
+-- Test serial full hash join.
+-- Resetting parallel_setup_cost should force a serial plan.
+-- Just to be safe, however, set enable_parallel_hash to off, as parallel full
+-- hash joins are only supported with shared hashtables.
+RESET parallel_setup_cost;
+SET enable_parallel_hash = off;
+SELECT * FROM hjtest_matchbits_t1 t1 FULL JOIN hjtest_matchbits_t2 t2 ON t1.id = t2.id;
+ROLLBACK TO settings;
+
+rollback;
 
 -- Verify that hash key expressions reference the correct
 -- nodes. Hashjoin's hashkeys need to reference its outer plan, Hash's
diff --git a/src/test/regress/sql/matview_data.sql b/src/test/regress/sql/matview_data.sql
index 059a5a97bf4..65de9dd5c9b 100644
--- a/src/test/regress/sql/matview_data.sql
+++ b/src/test/regress/sql/matview_data.sql
@@ -343,6 +343,604 @@ drop table jt3;
 drop table jt2;
 drop table jt1;
 
+--
+-- Test AQUMV (Answer Query Using Materialized Views) with join queries.
+-- Each matching test shows EXPLAIN + SELECT with GUC off (original plan),
+-- then EXPLAIN + SELECT with GUC on (MV rewrite). Results must match.
+--
+create table aqj_t1(a int, b int) distributed by (a);
+create table aqj_t2(a int, b int) distributed by (a);
+create table aqj_t3(a int, b int) distributed by (a);
+insert into aqj_t1 select i, i*10 from generate_series(1, 100) i;
+insert into aqj_t2 select i, i*100 from generate_series(1, 100) i;
+insert into aqj_t3 select i, i*1000 from generate_series(1, 100) i;
+analyze aqj_t1;
+analyze aqj_t2;
+analyze aqj_t3;
+
+-- 1. Two-table INNER JOIN exact match
+create materialized view mv_aqj_join2 as
+  select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+analyze mv_aqj_join2;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a order by 1 limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a order by 1 limit 5;
+
+-- 2. Join with WHERE clause
+create materialized view mv_aqj_where as
+  select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+analyze mv_aqj_where;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5 order by 1 limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5;
+select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 5 order by 1 limit 5;
+
+-- 3. Join with GROUP BY + aggregate
+create materialized view mv_aqj_agg as
+  select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+analyze mv_aqj_agg;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a order by 1 limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a;
+select aqj_t1.a, count(*) as cnt from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a group by aqj_t1.a order by 1 limit 5;
+
+-- 4. Non-match: different WHERE clause (should show Hash Join, not MV)
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a where aqj_t1.a > 10;
+
+-- 5. Non-match: different target list
+explain(costs off) select aqj_t1.b, aqj_t2.a from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+
+-- 6. Non-match: different join type (INNER vs LEFT)
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 left join aqj_t2 on aqj_t1.a = aqj_t2.a;
+
+-- 7. Three-table join
+create materialized view mv_aqj_join3 as
+  select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+analyze mv_aqj_join3;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a
+  order by 1 limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a;
+select aqj_t1.a, aqj_t2.b, aqj_t3.b as c
+  from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a join aqj_t3 on aqj_t2.a = aqj_t3.a
+  order by 1 limit 5;
+
+-- 8. Implicit join (FROM t1, t2 WHERE ...)
+create materialized view mv_aqj_implicit as
+  select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+analyze mv_aqj_implicit;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a order by 1 limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a;
+select aqj_t1.a, aqj_t2.b from aqj_t1, aqj_t2 where aqj_t1.a = aqj_t2.a order by 1 limit 5;
+
+-- 9. MV not up-to-date: after INSERT on base table
+insert into aqj_t1 values(999, 9990);
+set enable_answer_query_using_materialized_views = on;
+-- Should NOT use mv_aqj_join2 (status is 'i')
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+
+-- 10. After REFRESH: should use MV again
+refresh materialized view mv_aqj_join2;
+analyze mv_aqj_join2;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+
+-- 11. GUC off: should NOT use MV
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select aqj_t1.a, aqj_t2.b from aqj_t1 join aqj_t2 on aqj_t1.a = aqj_t2.a;
+
+--
+-- More complex join AQUMV test cases with richer schemas
+--
+
+create table aqj_orders(
+  order_id int,
+  customer_id int,
+  amount numeric(10,2),
+  status text,
+  order_date date
+) distributed by (order_id);
+
+create table aqj_customers(
+  customer_id int,
+  name text,
+  region text,
+  credit_limit numeric(10,2)
+) distributed by (customer_id);
+
+create table aqj_products(
+  product_id int,
+  name text,
+  category text,
+  price numeric(10,2)
+) distributed by (product_id);
+
+create table aqj_order_items(
+  item_id int,
+  order_id int,
+  product_id int,
+  quantity int
+) distributed by (item_id);
+
+insert into aqj_customers select i, 'cust_' || i, case when i % 3 = 0 then 'east' when i % 3 = 1 then 'west' else 'north' end, (i * 100)::numeric(10,2) from generate_series(1, 50) i;
+insert into aqj_orders select i, (i % 50) + 1, (i * 10.5)::numeric(10,2), case when i % 4 = 0 then 'shipped' when i % 4 = 1 then 'pending' when i % 4 = 2 then 'delivered' else 'cancelled' end, '2024-01-01'::date + (i % 365) from generate_series(1, 200) i;
+insert into aqj_products select i, 'prod_' || i, case when i % 5 = 0 then 'electronics' when i % 5 = 1 then 'books' when i % 5 = 2 then 'clothing' when i % 5 = 3 then 'food' else 'toys' end, (i * 5.99)::numeric(10,2) from generate_series(1, 30) i;
+insert into aqj_order_items select i, (i % 200) + 1, (i % 30) + 1, (i % 10) + 1 from generate_series(1, 500) i;
+
+analyze aqj_customers;
+analyze aqj_orders;
+analyze aqj_products;
+analyze aqj_order_items;
+
+-- 12. Join with multiple columns + WHERE on text column
+create materialized view mv_aqj_orders_cust as
+  select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+analyze mv_aqj_orders_cust;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+
+-- 13. Four-table join
+create materialized view mv_aqj_order_details as
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+analyze mv_aqj_order_details;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+
+-- 14. GROUP BY on join with multiple aggregates: sum, count, avg
+create materialized view mv_aqj_cust_summary as
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+analyze mv_aqj_cust_summary;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region
+  order by c.region;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+select c.region, count(*) as order_count, sum(o.amount) as total_amount, avg(o.amount) as avg_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region
+  order by c.region;
+
+-- 15. Join with expression in target list (arithmetic + function)
+create materialized view mv_aqj_expr as
+  select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+analyze mv_aqj_expr;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+
+-- 16. Non-match: same tables + expressions, but extra WHERE (should NOT match mv_aqj_expr)
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where c.region = 'east';
+
+-- 17. Non-match: same tables but different aggregate target list
+explain(costs off)
+  select c.region, sum(o.amount) as total_amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region;
+
+-- 18. Non-match: different join order (o JOIN c vs c JOIN o)
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_customers c join aqj_orders o on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+
+-- 19. Join with compound WHERE (multiple AND conditions)
+create materialized view mv_aqj_compound_where as
+  select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+analyze mv_aqj_compound_where;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off) select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50
+  order by o.order_id limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off) select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50;
+select o.order_id, o.amount, c.name
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending' and c.region = 'west' and o.amount > 50
+  order by o.order_id limit 5;
+
+-- 20. Self-join
+create materialized view mv_aqj_selfjoin as
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+analyze mv_aqj_selfjoin;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id
+  order by o1.order_id, o2.order_id limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id;
+select o1.order_id as id1, o2.order_id as id2, o1.amount as amt1, o2.amount as amt2
+  from aqj_orders o1 join aqj_orders o2 on o1.customer_id = o2.customer_id
+  where o1.order_id < o2.order_id
+  order by o1.order_id, o2.order_id limit 5;
+
+-- 21. GROUP BY with multi-column key on join
+create materialized view mv_aqj_grp_multi as
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+analyze mv_aqj_grp_multi;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+
+-- 22. Four-table join with WHERE and aggregate
+create materialized view mv_aqj_3way_agg as
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+analyze mv_aqj_3way_agg;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category
+  order by c.region, p.category limit 6;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category;
+select c.region, p.category, sum(oi.quantity) as total_qty, count(*) as line_count
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  where o.status = 'delivered'
+  group by c.region, p.category
+  order by c.region, p.category limit 6;
+
+-- 23. Implicit four-table join (comma style)
+create materialized view mv_aqj_implicit3 as
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+analyze mv_aqj_implicit3;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending'
+  order by o.order_id, p.name limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending';
+select o.order_id, c.name, p.name as product_name
+  from aqj_orders o, aqj_customers c, aqj_order_items oi, aqj_products p
+  where o.customer_id = c.customer_id and o.order_id = oi.order_id and oi.product_id = p.product_id
+    and o.status = 'pending'
+  order by o.order_id, p.name limit 5;
+
+-- 24. Result correctness across DML + REFRESH cycle
+insert into aqj_orders values(201, 1, 9999.99, 'shipped', '2025-12-31');
+set enable_answer_query_using_materialized_views = on;
+-- Stale: should NOT use MV
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+-- Refresh and verify MV is used again
+refresh materialized view mv_aqj_orders_cust;
+analyze mv_aqj_orders_cust;
+explain(costs off) select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped';
+-- The new row should appear in results via MV scan
+select o.order_id, o.amount, c.name, c.region
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped' and o.order_id = 201;
+
+-- 25. Post-DML comprehensive: refresh all, then verify GUC off vs on results
+refresh materialized view mv_aqj_order_details;
+refresh materialized view mv_aqj_expr;
+refresh materialized view mv_aqj_selfjoin;
+refresh materialized view mv_aqj_grp_multi;
+refresh materialized view mv_aqj_3way_agg;
+refresh materialized view mv_aqj_implicit3;
+analyze mv_aqj_order_details;
+analyze mv_aqj_expr;
+analyze mv_aqj_selfjoin;
+analyze mv_aqj_grp_multi;
+analyze mv_aqj_3way_agg;
+analyze mv_aqj_implicit3;
+
+-- Verify four-table join results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+select o.order_id, c.name as customer_name, p.name as product_name, oi.quantity, p.price
+  from aqj_orders o
+  join aqj_customers c on o.customer_id = c.customer_id
+  join aqj_order_items oi on o.order_id = oi.order_id
+  join aqj_products p on oi.product_id = p.product_id
+  order by o.order_id, p.name limit 5;
+
+-- Verify expression MV results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+
+set enable_answer_query_using_materialized_views = on;
+select o.order_id, o.amount * 1.1 as amount_with_tax, c.name, upper(c.region) as region_upper
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  order by o.order_id limit 5;
+
+-- Verify multi-key GROUP BY results after DML+refresh
+set enable_answer_query_using_materialized_views = off;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+
+set enable_answer_query_using_materialized_views = on;
+select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by c.region, o.status
+  order by c.region, o.status limit 6;
+
+-- 26. Non-match: LIMIT vs FETCH FIRST WITH TIES (limitOption differs)
+create materialized view mv_aqj_limit_test as
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+analyze mv_aqj_limit_test;
+
+set enable_answer_query_using_materialized_views = on;
+-- Same tables/WHERE/ORDER BY but FETCH FIRST WITH TIES: should NOT match
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id fetch first 5 rows with ties;
+-- Identical LIMIT query: should match
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'shipped'
+  order by o.order_id limit 5;
+
+-- 27. Match: FETCH FIRST WITH TIES exact match
+create materialized view mv_aqj_with_ties as
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+analyze mv_aqj_with_ties;
+
+set enable_answer_query_using_materialized_views = off;
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+select o.order_id, o.amount
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  where o.status = 'pending'
+  order by o.order_id fetch first 5 rows with ties;
+
+-- 28. Non-match: GROUP BY vs GROUP BY DISTINCT (groupDistinct differs)
+-- MV mv_aqj_grp_multi uses GROUP BY (groupDistinct=false, registered in catalog)
+-- Query uses GROUP BY DISTINCT — should NOT match
+set enable_answer_query_using_materialized_views = on;
+explain(costs off)
+  select c.region, o.status, count(*) as cnt, sum(o.amount) as total
+  from aqj_orders o join aqj_customers c on o.customer_id = c.customer_id
+  group by distinct c.region, o.status;
+
+-- Clean up AQUMV join test objects
+drop materialized view mv_aqj_with_ties;
+drop materialized view mv_aqj_limit_test;
+drop materialized view mv_aqj_implicit3;
+drop materialized view mv_aqj_3way_agg;
+drop materialized view mv_aqj_grp_multi;
+drop materialized view mv_aqj_selfjoin;
+drop materialized view mv_aqj_compound_where;
+drop materialized view mv_aqj_expr;
+drop materialized view mv_aqj_cust_summary;
+drop materialized view mv_aqj_order_details;
+drop materialized view mv_aqj_orders_cust;
+drop materialized view mv_aqj_implicit;
+drop materialized view mv_aqj_join3;
+drop materialized view mv_aqj_agg;
+drop materialized view mv_aqj_where;
+drop materialized view mv_aqj_join2;
+drop table aqj_order_items;
+drop table aqj_products;
+drop table aqj_customers;
+drop table aqj_orders;
+drop table aqj_t3;
+drop table aqj_t2;
+drop table aqj_t1;
+
 -- test drop table
 select mvname, datastatus from gp_matview_aux where mvname in ('mv0','mv1', 'mv2', 'mv3');
 drop materialized view mv2;
diff --git a/src/test/regress/sql/orca_parallel.sql b/src/test/regress/sql/orca_parallel.sql
new file mode 100644
index 00000000000..dc4689c6bc3
--- /dev/null
+++ b/src/test/regress/sql/orca_parallel.sql
@@ -0,0 +1,31 @@
+create schema orca_parallel;
+set search_path=orca_parallel, public;
+set statement_mem = '256MB';
+set optimizer=on;
+
+create table t1(a int, b int) with(parallel_workers=2) distributed by (a);
+create table t2(c int, d int ) with(parallel_workers=3) distributed by (c);
+insert into t1 select i, i+1 from generate_series(1, 1000)i;
+insert into t2 select i, i+2 from generate_series(1, 20000)i;
+analyze t1;
+analyze t2;
+
+set parallel_setup_cost=0;
+set max_parallel_workers_per_gather=4;
+set enable_parallel = on;
+
+explain (verbose, costs off) select * from t1  join t2  on t1.a = t2.c;
+explain (verbose, costs off) select * from t1  join t2  on t1.a = t2.d;
+explain (verbose, costs off) select * from t1  join t2  on t1.b = t2.c;
+explain (verbose, costs off) select * from t1  join t2  on t1.b = t2.d;
+
+
+reset enable_parallel;
+reset max_parallel_workers_per_gather;
+reset parallel_setup_cost;
+reset statement_mem;
+reset optimizer;
+
+-- start_ignore
+drop schema orca_parallel cascade;
+-- end_ignore
diff --git a/src/test/regress/sql/pg_stat.sql b/src/test/regress/sql/pg_stat.sql
index d9fc37850b0..383a9149186 100644
--- a/src/test/regress/sql/pg_stat.sql
+++ b/src/test/regress/sql/pg_stat.sql
@@ -6,17 +6,17 @@ create table pg_stat_test(a int);
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup
-from pg_stat_all_tables where relname = 'pg_stat_test';
+from gp_stat_all_tables_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup
-from pg_stat_user_tables where relname = 'pg_stat_test';
+from gp_stat_user_tables_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_all_indexes where relname = 'pg_stat_test';
+from gp_stat_all_indexes_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_user_indexes where relname = 'pg_stat_test';
+from gp_stat_user_indexes_summary where relname = 'pg_stat_test';
 
 begin; -- make analyze same transcation with insert to avoid double the pgstat causes by unorder message read.
 insert into pg_stat_test select * from generate_series(1, 100);
@@ -42,17 +42,17 @@ reset enable_seqscan;
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze
-from pg_stat_all_tables where relname = 'pg_stat_test';
+from gp_stat_all_tables_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, seq_scan, seq_tup_read, idx_scan, idx_tup_fetch, n_tup_ins, n_tup_upd,
     n_tup_del, n_tup_hot_upd, n_live_tup, n_dead_tup, n_mod_since_analyze
-from pg_stat_user_tables where relname = 'pg_stat_test';
+from gp_stat_user_tables_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_all_indexes where relname = 'pg_stat_test';
+from gp_stat_all_indexes_summary where relname = 'pg_stat_test';
 select
     schemaname, relname, indexrelname, idx_scan, idx_tup_read, idx_tup_fetch
-from pg_stat_user_indexes where relname = 'pg_stat_test';
+from gp_stat_user_indexes_summary where relname = 'pg_stat_test';
 
 reset optimizer;
 reset max_parallel_workers_per_gather;
diff --git a/src/test/regress/sql/qp_orca_fallback.sql b/src/test/regress/sql/qp_orca_fallback.sql
index 42ad5eef3b9..ecb892c2aa7 100644
--- a/src/test/regress/sql/qp_orca_fallback.sql
+++ b/src/test/regress/sql/qp_orca_fallback.sql
@@ -121,6 +121,53 @@ select array_agg(a order by b)
 -- Orca should fallback if a function in 'from' clause uses 'WITH ORDINALITY'
 SELECT * FROM jsonb_array_elements('["b", "a"]'::jsonb) WITH ORDINALITY;
 
+-- The walker that detects a CTE Consumer on a different slice than its
+-- replicated Producer. Without it ORCA would emit a plan with cross-slice
+-- replicated CTE Consumers that hangs at execution.
+-- start_ignore
+DROP TABLE IF EXISTS tbl1, tbl2;
+-- end_ignore
+CREATE TABLE tbl2 (id numeric, refrcode varchar(255), referenceid numeric)
+DISTRIBUTED REPLICATED;
+CREATE TABLE tbl1 (id bigserial, iscalctrg varchar(15) NOT NULL,
+                   iscalcdetail varchar(15))
+DISTRIBUTED REPLICATED;
+-- start_ignore
+INSERT INTO tbl2 SELECT i, 'A'||(i%5), 101991
+  FROM generate_series(1, 50000) i;
+INSERT INTO tbl1 (iscalctrg, iscalcdetail)
+  SELECT 'A'||(i%5), 'A'||(i%7) FROM generate_series(1, 50000) i;
+ANALYZE tbl1;
+ANALYZE tbl2;
+-- end_ignore
+
+-- Case 1: walker triggers fallback. With scalar subqueries on the CTE
+-- ORCA produces a plan whose CTE Producer is replicated and Consumers
+-- live on a different slice -- the walker raises ExmiExpr2DXLUnsupported
+-- and trace_fallback DETAIL says "CTE Consumer placed on a different
+-- slice than its replicated Producer".
+EXPLAIN (COSTS OFF)
+WITH t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.iscalctrg,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalctrg    LIMIT 1) AS r,
+       (SELECT refrcode FROM t2 WHERE refrcode = p.iscalcdetail LIMIT 1) AS r1
+FROM tbl1 p
+LIMIT 1;
+
+-- Case 2: walker correctly stays silent. The same CTE referenced from a
+-- JOIN: ORCA pins the Producer body to a single segment with a One-Time
+-- Filter (gp_execution_segment() = N), so the Producer's child
+-- distribution is EdtSingleton, not replicated -- the walker skips it.
+EXPLAIN (COSTS OFF)
+WITH t1 AS (SELECT * FROM tbl1),
+     t2 AS (SELECT id, refrcode FROM tbl2 WHERE referenceid = 101991)
+SELECT p.* FROM t1 p
+  JOIN t2 r  ON p.iscalctrg   = r.refrcode
+  JOIN t2 r1 ON p.iscalcdetail = r1.refrcode
+LIMIT 1;
+
+DROP TABLE tbl1, tbl2;
+
 -- start_ignore
 -- FIXME: gpcheckcat fails due to mismatching distribution policy if this table isn't dropped
 -- Keep this table around once this is fixed
diff --git a/src/test/regress/sql/shared_scan.sql b/src/test/regress/sql/shared_scan.sql
index 7234cef6e4a..80b4a1d52c7 100644
--- a/src/test/regress/sql/shared_scan.sql
+++ b/src/test/regress/sql/shared_scan.sql
@@ -120,3 +120,31 @@ where
 	(data_hour = date_trunc('day',data_hour) and stat.schema_name || '.' ||stat.table_name not in (select table_nm_23 from tbls_daily_report_23))
 	and (stat.schema_name || '.' ||stat.table_name not in (select table_nm_onl_act from tbls_w_onl_actl_data))
 	or (stat.schema_name || '.' ||stat.table_name in (select table_nm_onl_act from tbls_w_onl_actl_data));
+
+-- ORCA should fallback when a CTE over a replicated table is referenced
+-- from multiple scalar subqueries.
+-- ss_t1 needs enough rows (40000) to push ORCA to the cross-slice plan;
+-- with fewer rows the bug does not manifest and the test would silently
+-- pass even without the fix.
+-- start_ignore
+DROP TABLE IF EXISTS ss_t1, ss_t2;
+-- end_ignore
+CREATE TABLE ss_t1 AS
+  SELECT generate_series(1, 40000) id
+  DISTRIBUTED BY (id);
+CREATE TABLE ss_t2 AS
+  SELECT * FROM (VALUES (1, 10), (2, 20)) AS v(id, v)
+  DISTRIBUTED REPLICATED;
+ANALYZE ss_t1;
+ANALYZE ss_t2;
+
+SET statement_timeout = '15s';
+WITH
+    cte1 AS (SELECT v FROM ss_t2 WHERE id = 1),
+    cte2 AS (SELECT v FROM ss_t2 WHERE id = 2)
+  SELECT (SELECT v FROM cte1) + (SELECT v FROM cte2) +
+         (SELECT v FROM cte1) + (SELECT v FROM cte2) AS result
+  FROM ss_t1
+  LIMIT 1;
+RESET statement_timeout;
+DROP TABLE ss_t1, ss_t2;
diff --git a/src/test/regress/sql/tuplesort.sql b/src/test/regress/sql/tuplesort.sql
index 45c7c027cd8..fa5f87c7ec9 100644
--- a/src/test/regress/sql/tuplesort.sql
+++ b/src/test/regress/sql/tuplesort.sql
@@ -95,7 +95,7 @@ CLUSTER abbrev_abort_uuids USING abbrev_abort_uuids__abort_increasing_idx;
 -- head
 SELECT id, abort_increasing, abort_decreasing, noabort_increasing, noabort_decreasing
 FROM abbrev_abort_uuids
-ORDER BY ctid LIMIT 5;
+ORDER BY ctid, id LIMIT 5;
 
 -- tail
 SELECT id, abort_increasing, abort_decreasing, noabort_increasing, noabort_decreasing
diff --git a/src/test/regress/sql/union_gp.sql b/src/test/regress/sql/union_gp.sql
index e7cac952704..9e9e5c3a815 100644
--- a/src/test/regress/sql/union_gp.sql
+++ b/src/test/regress/sql/union_gp.sql
@@ -721,9 +721,32 @@ drop table r_1240;
 drop table p1_1240;
 
 --
--- Clean up
+-- Test CTAS with UNION ALL when branches have different typmods (issue #1431).
+-- ORCA should resolve the output column type to character varying (no length),
+-- same as the Postgres planner, instead of picking the first branch's typmod.
 --
+create table union_ctas_t1(id int, name varchar(1));
+create table union_ctas_t2(id int, name varchar(2));
+insert into union_ctas_t1 values (1, 'a');
+insert into union_ctas_t2 values (1, 'ab');
+
+create table union_ctas_result as
+  (select id, name from union_ctas_t1)
+  union all
+  (select id, name from union_ctas_t2);
+
+-- name column should be "character varying" without length, not varchar(1)
+select atttypmod from pg_attribute
+where attrelid = 'union_ctas_result'::regclass and attname = 'name';
+
+-- data should not be truncated
+select * from union_ctas_result order by name;
 
+drop table union_ctas_t1, union_ctas_t2, union_ctas_result;
+
+--
+-- Clean up
+--
 DROP TABLE IF EXISTS T_a1 CASCADE;
 DROP TABLE IF EXISTS T_b2 CASCADE;
 DROP TABLE IF EXISTS T_random CASCADE;
diff --git a/src/test/regress/sql/vacuum_gp.sql b/src/test/regress/sql/vacuum_gp.sql
index 198a80f4a93..ed4bfe4f699 100644
--- a/src/test/regress/sql/vacuum_gp.sql
+++ b/src/test/regress/sql/vacuum_gp.sql
@@ -298,11 +298,14 @@ drop table if exists relcache_leak_in_motion;
 -- end_ignore
 create table relcache_leak_in_motion(v1 int);
 insert into relcache_leak_in_motion values(generate_series(0, 10000));
+BEGIN;
+SET LOCAL synchronous_commit = local;
 SELECT gp_inject_fault('interconnect_stop_recv_chunk', 'interrupt', dbid)
   FROM gp_segment_configuration WHERE content = -1 and role='p';
 analyze relcache_leak_in_motion;
 SELECT gp_inject_fault('interconnect_stop_recv_chunk', 'reset', dbid)
   FROM gp_segment_configuration WHERE content = -1 and role='p';
+COMMIT;
 -- start_ignore
 drop table if exists relcache_leak_in_motion;
 -- end_ignore
diff --git a/src/test/regress/sql/workfile/hashjoin_spill.sql b/src/test/regress/sql/workfile/hashjoin_spill.sql
index 08e30501ef2..7166842dae5 100644
--- a/src/test/regress/sql/workfile/hashjoin_spill.sql
+++ b/src/test/regress/sql/workfile/hashjoin_spill.sql
@@ -40,6 +40,10 @@ CREATE TABLE test_hj_spill (i1 int, i2 int, i3 int, i4 int, i5 int, i6 int, i7 i
 insert into test_hj_spill SELECT i,i,i%1000,i,i,i,i,i from
 	(select generate_series(1, nsegments * 15000) as i from
 	(select count(*) as nsegments from gp_segment_configuration where role='p' and content >= 0) foo) bar;
+
+-- Collect statistics to ensure ORCA generates correct execution plan
+ANALYZE test_hj_spill;
+
 SET statement_mem=1024;
 set gp_resqueue_print_operator_memory_limits=on;