diff --git a/.gitmodules b/.gitmodules index 038b1484190..1dc2cbf7153 100644 --- a/.gitmodules +++ b/.gitmodules @@ -1,3 +1,16 @@ [submodule "gpcontrib/gpcloud/test/googletest"] path = gpcontrib/gpcloud/test/googletest url = https://github.com/google/googletest.git +[submodule "contrib/pax_storage/src/cpp/contrib/googletest"] + path = contrib/pax_storage/src/cpp/contrib/googletest + url = https://code.hashdata.xyz/cloudberry/googletest +[submodule "contrib/pax_storage/src/cpp/contrib/tabulate"] + path = contrib/pax_storage/src/cpp/contrib/tabulate + url = https://code.hashdata.xyz/cloudberry/tabulate +[submodule "contrib/pax_storage/src/cpp/contrib/googlebench"] + path = contrib/pax_storage/src/cpp/contrib/googlebench + url = https://code.hashdata.xyz/cloudberry/benchmark.git +[submodule "contrib/pax_storage/src/cpp/contrib/cpp-stub"] + path = contrib/pax_storage/src/cpp/contrib/cpp-stub + url = https://code.hashdata.xyz/cloudberry/cpp-stub.git + branch = dev diff --git a/GNUmakefile.in b/GNUmakefile.in index 77c2ab55218..e6333e39bec 100644 --- a/GNUmakefile.in +++ b/GNUmakefile.in @@ -31,6 +31,9 @@ all: $(MAKE) -C contrib/pg_buffercache all ifeq ($(with_openssl), yes) $(MAKE) -C contrib/sslinfo all +endif +ifeq ($(enable_pax), yes) + $(MAKE) -C contrib/pax_storage all endif $(MAKE) -C gpMgmt all $(MAKE) -C gpcontrib all @@ -73,6 +76,9 @@ install: $(MAKE) -C contrib/tablefunc $@ $(MAKE) -C contrib/passwordcheck $@ $(MAKE) -C contrib/pg_buffercache $@ +ifeq ($(enable_pax), yes) + $(MAKE) -C contrib/pax_storage $@ +endif ifeq ($(with_openssl), yes) $(MAKE) -C contrib/sslinfo $@ endif @@ -180,6 +186,9 @@ ICW_TARGETS += contrib/extprotocol contrib/dblink contrib/pg_trgm ICW_TARGETS += contrib/indexscan contrib/hstore contrib/pgcrypto ICW_TARGETS += contrib/tablefunc contrib/passwordcheck ICW_TARGETS += contrib/pg_buffercache +ifeq ($(enable_pax), yes) +ICW_TARGETS += contrib/pax_storage +endif # sslinfo depends on openssl ifeq ($(with_openssl), yes) ICW_TARGETS += 
contrib/sslinfo diff --git a/configure b/configure index 57fec242cce..47b466a34e4 100755 --- a/configure +++ b/configure @@ -751,6 +751,7 @@ ICU_CFLAGS with_icu enable_thread_safety INCLUDES +enable_pax enable_preload_ic_module enable_ic_proxy enable_external_fts @@ -901,6 +902,7 @@ enable_gpcloud enable_external_fts enable_ic_proxy enable_preload_ic_module +enable_pax enable_thread_safety with_icu with_tcl @@ -1616,6 +1618,7 @@ Optional Features: library) --disable-preload-ic-module disable preload interconnect module + --enable-pax enable pax support --disable-thread-safety disable thread-safety in client libraries --enable-openssl-redirect enable redirect openssl interface to internal @@ -9098,6 +9101,36 @@ fi { $as_echo "$as_me:${as_lineno-$LINENO}: result: checking whether to build with preload ic module ... $enable_preload_ic_module" >&5 $as_echo "checking whether to build with preload ic module ... $enable_preload_ic_module" >&6; } +# +# pax support +# + + +# Check whether --enable-pax was given. +if test "${enable_pax+set}" = set; then : + enableval=$enable_pax; + case $enableval in + yes) + +$as_echo "#define USE_PAX_STORAGE 1" >>confdefs.h + + ;; + no) + : + ;; + *) + as_fn_error $? "no argument expected for --enable-pax option" "$LINENO" 5 + ;; + esac + +else + enable_pax=no + +fi + + +{ $as_echo "$as_me:${as_lineno-$LINENO}: result: checking whether to build with pax support ... $enable_pax" >&5 +$as_echo "checking whether to build with pax support ... $enable_pax" >&6; } # # Include directories diff --git a/configure.ac b/configure.ac index d9df92f6768..1686a00416b 100644 --- a/configure.ac +++ b/configure.ac @@ -925,6 +925,16 @@ PGAC_ARG_BOOL(enable, preload-ic-module, yes, AC_MSG_RESULT([checking whether to build with preload ic module ... 
$enable_preload_ic_module]) AC_SUBST(enable_preload_ic_module) +# +# pax support +# +PGAC_ARG_BOOL(enable, pax, no, + [enable pax support], + [AC_DEFINE(USE_PAX_STORAGE, 1, + [Define to 1 to support pax])]) +AC_MSG_RESULT([checking whether to build with pax support ... $enable_pax]) +AC_SUBST(enable_pax) + # # Include directories # diff --git a/contrib/Makefile b/contrib/Makefile index fceafaffe8a..2292adb88f2 100644 --- a/contrib/Makefile +++ b/contrib/Makefile @@ -98,6 +98,12 @@ else ALWAYS_SUBDIRS += hstore_plpython jsonb_plpython ltree_plpython endif +ifeq ($(enable_pax),yes) +SUBDIRS += pax_storage +else +ALWAYS_SUBDIRS += pax_storage +endif + # Missing: # start-scripts \ (does not have a makefile) diff --git a/contrib/pax_storage/.ci/tf/qingcloud-provider.tf b/contrib/pax_storage/.ci/tf/qingcloud-provider.tf deleted file mode 100644 index 02941a05be8..00000000000 --- a/contrib/pax_storage/.ci/tf/qingcloud-provider.tf +++ /dev/null @@ -1,86 +0,0 @@ -variable "qingcloud_access_key" { - sensitive = true - type = string -} - -variable "qingcloud_secret_key" { - sensitive = true - type = string -} - -variable "qingcloud_zone" { - default = "pek3c" -} - -variable "instance_name" { - default = "ci" -} - -variable "instance_image" { - default = "img-qbpas5m2" -} - -variable "instance_class" { - default = 202 -} - -variable "instance_cpu" { - default = 16 -} - -variable "instance_memory" { - default = 16384 -} - -variable "instance_os_disk_size" { - default = 100 -} - -variable "instance_vxnet" { - default = "vxnet-5tjdylj" -} - -variable "instance_keypair" { - default = [ - "kp-o07unn26"] -} - -terraform { - required_providers { - qingcloud = { - source = "HashDataInc/qingcloud" - version = "1.2.7" - } - ansible = { - source = "nbering/ansible" - version = "1.0.4" - } - } -} - -provider "qingcloud" { - access_key = var.qingcloud_access_key - secret_key = var.qingcloud_secret_key - zone = var.qingcloud_zone -} - - -resource "qingcloud_instance" "ci" { - name = 
var.instance_name - image_id = var.instance_image - instance_class = var.instance_class - cpu = var.instance_cpu - memory = var.instance_memory - os_disk_size = var.instance_os_disk_size - managed_vxnet_id = var.instance_vxnet - keypair_ids = var.instance_keypair -} - -resource "ansible_host" "ci" { - inventory_hostname = qingcloud_instance.ci.private_ip - groups = [ - "runner"] - vars = { - ansible_user = "root" - } -} diff --git a/contrib/pax_storage/.clang-tidy b/contrib/pax_storage/.clang-tidy index 6b6594d4fb7..9e3bff8027b 100644 --- a/contrib/pax_storage/.clang-tidy +++ b/contrib/pax_storage/.clang-tidy @@ -12,7 +12,7 @@ Checks: '-*, modernize-avoid-bind, modernize-loop-convert, modernize-make-shared, - modernize-make-unique, + - modernize-make-unique, modernize-raw-string-literal, modernize-redundant-void-arg, modernize-replace-auto-ptr, @@ -37,7 +37,7 @@ Checks: '-*, readability-avoid-const-params-in-decls, readability-const-return-type, readability-container-size-empty, - readability-convert-member-functions-to-static, + - readability-convert-member-functions-to-static, readability-deleted-default, readability-make-member-function-const, readability-misplaced-array-index, @@ -52,7 +52,7 @@ Checks: '-*, readability-uniqueptr-delete-release, readability-redundant-member-init, readability-simplify-subscript-expr, - readability-simplify-boolean-expr, + - readability-simplify-boolean-expr, readability-inconsistent-declaration-parameter-name, readability-identifier-naming, @@ -68,7 +68,6 @@ Checks: '-*, bugprone-incorrect-roundings, bugprone-infinite-loop, bugprone-integer-division, - bugprone-macro-parentheses, bugprone-macro-repeated-side-effects, bugprone-misplaced-operator-in-strlen-in-alloc, bugprone-misplaced-pointer-artithmetic-in-alloc, @@ -225,4 +224,4 @@ CheckOptions: - key: modernize-use-transparent-functors.SafeMode value: 1 - key: modernize-use-emplace.IgnoreImplicitConstructors - value: 1 \ No newline at end of file + value: 1 diff --git 
a/contrib/pax_storage/.githooks/pre-push b/contrib/pax_storage/.githooks/pre-push deleted file mode 100755 index 22bebb8148b..00000000000 --- a/contrib/pax_storage/.githooks/pre-push +++ /dev/null @@ -1,25 +0,0 @@ -#!/bin/sh -# -# Verify what is about to be pushed. Called by "git -# push" after it has checked the remote status, but before anything has been -# pushed. If this script exits with a non-zero status nothing will be pushed. -# - -rc=0 - -if [ -x "./tools/cpplint.py" ]; then - echo "Running cpplint ..." - mkdir -p .tmp/ - ./tools/cpplint.py --counting=detailed --recursive . > .tmp/cpplint.log 2>&1 - rc=$? - if [ $rc -ne 0 ]; then - tail -n 1 .tmp/cpplint.log - echo "" - echo "ERROR cpplint returned errors!" - echo "ERROR Fix the problem and use 'git add' to update your changes." - echo "ERROR See `pwd`/.tmp/cpplint.log for more information." - echo "" - fi -fi - -exit $rc \ No newline at end of file diff --git a/contrib/pax_storage/.gitignore b/contrib/pax_storage/.gitignore index 76807d0dbc3..1fe686d3b2e 100644 --- a/contrib/pax_storage/.gitignore +++ b/contrib/pax_storage/.gitignore @@ -20,5 +20,5 @@ clang-tidy.result **/*.pb.cc # Executables -*.out +/*.out !src/data/expected/*.out diff --git a/contrib/pax_storage/.gitlab-ci.yml b/contrib/pax_storage/.gitlab-ci.yml deleted file mode 100644 index 51415fcc444..00000000000 --- a/contrib/pax_storage/.gitlab-ci.yml +++ /dev/null @@ -1,71 +0,0 @@ -stages: - - build - -.global_variables: &global_variables - # Runner instance name, passed to Terraform - TF_VAR_instance_name: "cbdb-test-pipeline-${CI_PIPELINE_ID}-job-${CI_JOB_ID}" - TF_VAR_qingcloud_access_key: "key" - TF_VAR_qingcloud_secret_key: "secret" - # Custom clone path on runner instance - GIT_SUBMODULE_STRATEGY: "normal" - GIT_DEPTH: 0 - CI_USER: root - # For internal deploy - ARTIFACTORY_USERNAME: "admin" - ARTIFACTORY_PASSWORD: "token" - AWS_ACCESS_KEY_ID: "${TF_VAR_qingcloud_access_key}" - AWS_SECRET_ACCESS_KEY: "${TF_VAR_qingcloud_secret_key}" - 
GIT_CLONE_PATH: "/code/gpdb_pax_src" - # cbdb project dir - CBDB_PROJECT_DIR: "/code/gpdb_src" - # For artifacts - BUCKET_INTERMEDIATE: "http://artifactory.hashdata.xyz/artifactory/hashdata-repository/intermediate-artifacts" - # For pax storage project - CBDB_PAX_BRANCH: $CI_COMMIT_BRANCH - -.build_script: &build_script - script: | - git clone -b feature-pax https://buildbot:Passw0rd@code.hashdata.xyz/cloudberry/cbdb.git $CBDB_PROJECT_DIR - cd /code/gpdb_src - git submodule update --init --recursive - cd /code - echo "${CI_PIPELINE_ID}" > ${CBDB_PROJECT_DIR}/BUILD_NUMBER - bash ${CBDB_PROJECT_DIR}/hd-ci/compile_cbdb.bash - bash ${GIT_CLONE_PATH}/hd-ci/compile_pax.bash - bash ${GIT_CLONE_PATH}/hd-ci/clang_tidy_pax.bash - cp ${CBDB_PROJECT_DIR}/cbdb-artifacts.txt ${CI_PROJECT_DIR}/cbdb-artifacts.txt - touch /code/CI_STATUS - -.build_artifacts: &build_artifacts - artifacts: - name: "artifacts" - when: always - paths: - - ${CI_PROJECT_DIR}/cbdb-artifacts.txt - - ${GIT_CLONE_PATH}/clang-tidy.result - reports: - dotenv: ${CI_PROJECT_DIR}/cbdb-artifacts.txt - -.cbdb_test_rules: &cbdb_test_rules - rules: - - if: $CI_COMMIT_TAG - when: never - - if: '$RUN_NIGHTLY_BUILD == "true"' - when: always - - if: '$RUN_TEST_BUILD == "true"' - when: always - - if: '$CI_PIPELINE_SOURCE == "pipeline"' - when: always - - when: always - -x86_64:build: - stage: build - variables: - <<: *global_variables - <<: *build_script - <<: *build_artifacts - <<: *cbdb_test_rules - timeout: 8 hours - retry: - max: 2 - when: always diff --git a/contrib/pax_storage/.gitmodules b/contrib/pax_storage/.gitmodules index 884a7c5972b..5c3c84dc64d 100644 --- a/contrib/pax_storage/.gitmodules +++ b/contrib/pax_storage/.gitmodules @@ -5,3 +5,6 @@ path = src/cpp/contrib/zstd url = https://code.hashdata.xyz/cloudberry/lib_zstd.git branch = v1.5.5 +[submodule "src/cpp/contrib/cpp-stub"] + path = src/cpp/contrib/cpp-stub + url = https://code.hashdata.xyz/cloudberry/cpp-stub.git diff --git 
a/contrib/pax_storage/CMakeLists.txt b/contrib/pax_storage/CMakeLists.txt index b4ab18181ea..2a6cde93a82 100644 --- a/contrib/pax_storage/CMakeLists.txt +++ b/contrib/pax_storage/CMakeLists.txt @@ -2,73 +2,74 @@ project(Pax) cmake_minimum_required (VERSION 3.11.0) set(CMAKE_CXX_STANDARD 14) -find_program( - PG_CONFIG pg_config - HINTS ${PG_PATH} - PATH_SUFFIXES bin - DOC "The path to the pg_config of the CBDB version to compile against") +set(TOP_DIR ${PROJECT_SOURCE_DIR}/../..) +set(CBDB_INCLUDE_DIR ${TOP_DIR}/src/include) +set(CMAKE_EXPORT_COMPILE_COMMANDS ON) +set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -g") -if(NOT PG_CONFIG) - message(FATAL_ERROR "Unable to find 'pg_config'") -endif() - -# Function to call pg_config and extract values. -function(GET_PG_CONFIG var) - set(_temp) - - # Only call pg_config if the variable didn't already have a value. - if(NOT ${var}) - execute_process( - COMMAND ${PG_CONFIG} ${ARGN} - OUTPUT_VARIABLE _temp - OUTPUT_STRIP_TRAILING_WHITESPACE) - endif() - - set(${var} - ${_temp} - PARENT_SCOPE) -endfunction() +# Build gtest options +option(BUILD_GTEST "Build with google test" ON) -# Get CBDB configuration from pg_config -get_pg_config(PG_INCLUDEDIR --includedir) -# TODO check exists if this is needed -set(CBDB_INCLUDE_DIR ${PG_INCLUDEDIR}/postgresql/server) +option(BUILD_GBENCH "Build with google benchmark" OFF) -# Debug options -option(ENBALE_DEBUG "Enable debug" ON) +# Build pax tools +option(BUILD_TOOLS "Build with pax tools" ON) -# Build gtest options -option(BUILD_GTEST "Build with google test" ON) - -# Build pax format lib -option(BUILD_PAX_FORMAT "Build pax format lib" OFF) +# env CBDB_BUILD_TYPE is set by Lighting pipeline +if (NOT DEFINED ENV{CBDB_BUILD_TYPE}) + set(ENV{CBDB_BUILD_TYPE} "debug") +endif() +set(CBDB_BUILD_TYPE $ENV{CBDB_BUILD_TYPE}) +message(STATUS "env CBDB_BUILD_TYPE=$ENV{CBDB_BUILD_TYPE} => ${CBDB_BUILD_TYPE}") -if (ENBALE_DEBUG) - ADD_DEFINITIONS(-DENBALE_DEBUG) - # Use to build compile_commands.json - 
set(CMAKE_EXPORT_COMPILE_COMMANDS ON) - SET(CMAKE_BUILD_TYPE "Debug") - SET(CMAKE_CXX_FLAGS_DEBUG "$ENV{CXXFLAGS} -O0 -Wall -g -ggdb") - SET(CMAKE_CXX_FLAGS_RELEASE "$ENV{CXXFLAGS} -O3 -Wall") -else() +if (${CBDB_BUILD_TYPE} STREQUAL "release") SET(CMAKE_BUILD_TYPE "Release") + SET(CMAKE_CXX_FLAGS_RELEASE "$ENV{CXXFLAGS} -O3") # no need build gtest in release mode SET(BUILD_GTEST OFF) -endif(ENBALE_DEBUG) - -# Vec options -option(VEC_BUILD "Build pax vectorization version" OFF) -set(VEC_HOME "" CACHE STRING "Path to vectorization home") -if (VEC_BUILD) - -if("${VEC_HOME}" STREQUAL "") - message(FATAL_ERROR "No found vectorization home setting. Using -DVEC_HOME to spec vectorization home") +elseif(${CBDB_BUILD_TYPE} STREQUAL "debug") + ADD_DEFINITIONS(-DENABLE_DEBUG) + # Use to build compile_commands.json + SET(CMAKE_BUILD_TYPE "Debug") + SET(CMAKE_CXX_FLAGS_DEBUG "$ENV{CXXFLAGS} -O0 -ggdb") +else() + message(FATAL_ERROR "unknown CBDB_BUILD_TYPE: ${CBDB_BUILD_TYPE}") endif() -set(CBDB_ROOT_INCLUDE_DIR ${PG_INCLUDEDIR}) -ADD_DEFINITIONS(-DVEC_BUILD) +if(BUILD_GBENCH) + SET(BUILD_GTEST ON) +endif(BUILD_GBENCH) + +if (BUILD_GTEST) + SET(CMAKE_C_FLAGS_DEBUG "${CMAKE_C_FLAGS_DEBUG} -no-pie -fno-stack-protector -Wall -Wno-unused-function -Wno-unused-variable") + SET(CMAKE_CXX_FLAGS_DEBUG "${CMAKE_CXX_FLAGS_DEBUG} -fno-access-control -fno-inline -Wno-pmf-conversions -Wl,--allow-multiple-definition -no-pie -fno-stack-protector") +endif(BUILD_GTEST) + +# Plasma options +option (ENABLE_PLASMA "Enable plasma cache" OFF) +if (ENABLE_PLASMA) +ADD_DEFINITIONS(-DENABLE_PLASMA) +# plasma need use CXX_STANDARD 17 +set(CMAKE_CXX_STANDARD 17) +endif() +# Vec options +include(CheckSymbolExists) +SET(PG_CONFIG_HEADER_FILE "${CBDB_INCLUDE_DIR}/pg_config.h") +CHECK_SYMBOL_EXISTS(USE_VECTORIZATION "${PG_CONFIG_HEADER_FILE}" VEC_BUILD) +message(STATUS "pg_config.h => ${PG_CONFIG_HEADER_FILE}") +if (VEC_BUILD) + set(VEC_HOME "${PROJECT_SOURCE_DIR}/../vectorization") + 
ADD_DEFINITIONS(-DVEC_BUILD) + message(STATUS "Build pax with vectorization support, VEC_HOME=${VEC_HOME}") +else() + message(STATUS "Build pax without vectorization support") endif(VEC_BUILD) + +## find dependencies +## the dependencies checked depend on the values of the options above. +list(APPEND CMAKE_MODULE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/") +include(FindDependencies) add_subdirectory(src/cpp) diff --git a/contrib/pax_storage/FindDependencies.cmake b/contrib/pax_storage/FindDependencies.cmake new file mode 100644 index 00000000000..c98e1eb3a67 --- /dev/null +++ b/contrib/pax_storage/FindDependencies.cmake @@ -0,0 +1,37 @@ +find_package(BISON REQUIRED) + +## protobuf +include(FindProtobuf) +find_package(Protobuf 3.6.1 REQUIRED) + +# zstd +# in our image snapshot, zstd is managed using pkg-config, so the pkg-config method is tried first here +find_package(PkgConfig QUIET) +if(PKGCONFIG_FOUND) + pkg_check_modules(ZSTD libzstd) +endif() +if(NOT ZSTD_FOUND) + find_package(ZSTD QUIET) + if(NOT ZSTD_FOUND) + message(FATAL_ERROR "zstd not found") + endif() +endif() + +## for vectorization +if (VEC_BUILD) + find_package(PkgConfig REQUIRED) + pkg_check_modules(GLIB REQUIRED glib-2.0) + + # resolve the vectorization dependency, or the header files will be missing + message(STATUS "Resolve vectorization dependency ...") + execute_process( + COMMAND make download_arrow + WORKING_DIRECTORY ${VEC_HOME} + RESULT_VARIABLE CMD_RESULT + ) + if(CMD_RESULT EQUAL 0) + message(STATUS "Resolve vectorization dependency succeeded.") + else() + message(FATAL_ERROR "Resolve vectorization dependency failed with result: ${CMD_RESULT}") + endif() +endif(VEC_BUILD) \ No newline at end of file diff --git a/contrib/pax_storage/Makefile b/contrib/pax_storage/Makefile new file mode 100644 index 00000000000..8a6f143713d --- /dev/null +++ b/contrib/pax_storage/Makefile @@ -0,0 +1,59 @@ +# contrib/pax_storage/Makefile + +MODULE_big = pax +OBJS = \ + $(WIN32RES) +PG_CPPFLAGS = -I/usr/local/include +PG_CXXFLAGS 
= -std=c++14 + +PGFILEDESC = "pax - PAX table access method" +SHLIB_LINK += -luuid + +REGRESS = setup +REGRESS += detoast ddl types update +# FIXME: several plans are bad in update_gp when using orca +# REGRESS += update_gp +REGRESS += teardown + +ifdef USE_PGXS +PG_CONFIG = pg_config +PGXS := $(shell $(PG_CONFIG) --pgxs) +include $(PGXS) +else +subdir = contrib/pax_storage +top_builddir = ../../ +include $(top_builddir)/src/Makefile.global +include $(top_srcdir)/contrib/contrib-global.mk +endif + +REGRESS_OPTS += --init-file=$(top_builddir)/src/test/regress/init_file + +.PHONY: all +all: build-pax + +.PHONY: install-data build-pax +build-pax: + @echo "build pax" + mkdir -p build + cd build && cmake .. -DCMAKE_INSTALL_PREFIX=$(DESTDIR)$(prefix) && make -j8 && cp src/cpp/libpax.so ../pax.so + +install-data: build-pax + $(INSTALL_DATA) pax-cdbinit--1.0.sql '$(DESTDIR)$(datadir)/cdb_init.d/pax-cdbinit--1.0.sql' + +.PHONY: install +install: install-data + @echo "install data" + make -C build install + +.PHONY: uninstall-data + +uninstall-data: + $(RM) '$(DESTDIR)$(datadir)/cdb_init.d/pax-cdbinit--1.0.sql' + +uninstall: uninstall-data + +clean-data: + $(RM) pax-cdbinit--1.0.sql + $(RM) -r build + +clean: clean-data diff --git a/contrib/pax_storage/README.md b/contrib/pax_storage/README.md index f26eeaf11be..e82817afed5 100644 --- a/contrib/pax_storage/README.md +++ b/contrib/pax_storage/README.md @@ -43,7 +43,7 @@ make -j ### Build GTEST 1. make sure already build pax with cmake option `-DBUILD_GTEST=on`, default value is on -2. better with debug cmake option `-DENBALE_DEBUG=on`, default value is on +2. better with debug cmake option `-DENABLE_DEBUG=on`, default value is on 3. 
run tests ``` diff --git a/contrib/pax_storage/expected/ddl.out b/contrib/pax_storage/expected/ddl.out new file mode 100644 index 00000000000..2917f049b80 --- /dev/null +++ b/contrib/pax_storage/expected/ddl.out @@ -0,0 +1,73 @@ +set default_table_access_method = 'pax'; +create table pax_test.t1( + id int, + name text not null, + height float not null, + decimal_col decimal(10, 2) not null, + created_at timestamp with time zone not null, + updated_at timestamp with time zone not null +) using pax distributed BY (id); +\d+ pax_test.t1 + Table "pax_test.t1" + Column | Type | Collation | Nullable | Default | Storage | Stats target | Description +-------------+--------------------------+-----------+----------+---------+----------+--------------+------------- + id | integer | | | | plain | | + name | text | | not null | | extended | | + height | double precision | | not null | | plain | | + decimal_col | numeric(10,2) | | not null | | main | | + created_at | timestamp with time zone | | not null | | plain | | + updated_at | timestamp with time zone | | not null | | plain | | +Distributed by: (id) + +create table pax_test.t2( + id int, + name text not null, + height float not null, + decimal_col decimal(10, 2) not null, + created_at timestamp with time zone not null, + updated_at timestamp with time zone not null +); +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'id' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. 
+\d+ pax_test.t2 + Table "pax_test.t2" + Column | Type | Collation | Nullable | Default | Storage | Stats target | Description +-------------+--------------------------+-----------+----------+---------+----------+--------------+------------- + id | integer | | | | plain | | + name | text | | not null | | extended | | + height | double precision | | not null | | plain | | + decimal_col | numeric(10,2) | | not null | | main | | + created_at | timestamp with time zone | | not null | | plain | | + updated_at | timestamp with time zone | | not null | | plain | | +Distributed by: (id) + +insert into pax_test.t1 (id, name, height, decimal_col, created_at, updated_at) values + (1, 'Alice', 1.65, 1.23, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'), + (2, 'Bob', 1.75, 2.34, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'), + (3, 'Carol', 1.85, 3.45, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'); +alter table pax_test.t1 add column new_col1 int; +alter table pax_test.t1 add column new_col2 int default null; +alter table pax_test.t1 add column new_col3 int default 0; +alter table pax_test.t1 add column new_col4 int default 12; +select * from pax_test.t1; + id | name | height | decimal_col | created_at | updated_at | new_col1 | new_col2 | new_col3 | new_col4 +----+-------+--------+-------------+-------------------------------------+-------------------------------------+----------+----------+----------+---------- + 1 | Alice | 1.65 | 1.23 | Wed May 17 02:56:49.633664 2023 PDT | Wed May 17 02:56:49.633664 2023 PDT | | | 0 | 12 + 2 | Bob | 1.75 | 2.34 | Wed May 17 02:56:49.633664 2023 PDT | Wed May 17 02:56:49.633664 2023 PDT | | | 0 | 12 + 3 | Carol | 1.85 | 3.45 | Wed May 17 02:56:49.633664 2023 PDT | Wed May 17 02:56:49.633664 2023 PDT | | | 0 | 12 +(3 rows) + +alter table pax_test.t1 drop column new_col2; +alter table pax_test.t1 drop column new_col3; +vacuum pax_test.t1; +vacuum full pax_test.t1; +drop table 
pax_test.t1; +drop table pax_test.t2; +-- alter column with options +create table pax_test.t3 (v1 numeric(100,1)) with(compresstype=zstd, compresslevel=1); +alter table pax_test.t3 alter column v1 type numeric; +drop table pax_test.t3; +-- add column with options +create table pax_test.t4 (v1 text) with(compresstype=zstd, compresslevel=1); +alter table pax_test.t4 add column v2 text; +drop table pax_test.t4; diff --git a/contrib/pax_storage/expected/detoast.out b/contrib/pax_storage/expected/detoast.out new file mode 100644 index 00000000000..ded4073a380 --- /dev/null +++ b/contrib/pax_storage/expected/detoast.out @@ -0,0 +1,91 @@ +CREATE TABLE toasttest_external(f1 text); +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. +-- The storage `EXTERNAL` allows out-of-line storage but not compression. +alter table toasttest_external alter column f1 set storage external; +-- These tests are sensitive to block size. In CBDB, the block +-- size is 32 kB, whereas in PostgreSQL it's 8kB. Therefore make +-- the data 4x larger here. +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +-- expect >0 blocks +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty + FROM pg_class where relname = 'toasttest_external'; + is_empty +---------- + f +(1 row) + +create table toasttest_external_pax(f1 text) using pax; +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. 
+HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. +insert into toasttest_external_pax select * from toasttest_external; +drop table toasttest_external; +-- If pax insert toast here, Then after drop toasttest_external, toast +-- will not get the source data. +select length(f1) from toasttest_external_pax; + length +-------- + 12000 + 12000 + 12000 + 12000 +(4 rows) + +drop table toasttest_external_pax; +CREATE TABLE toasttest_compress(f1 text); +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. +-- The storage `MAIN` allows compression but not out-of-line storage. +alter table toasttest_compress alter column f1 set storage main; +-- about 1M +INSERT INTO toasttest_compress values (repeat('1234567890123456',1024 * 64)); +-- should be true, becase it's not store in toast table +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty FROM pg_class where relname = 'toasttest_compress'; + is_empty +---------- + t +(1 row) + +create table toasttest_compress_pax(f1 text) using pax; +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. 
+insert into toasttest_compress_pax select * from toasttest_compress; +drop table toasttest_compress; +select length(f1) from toasttest_compress_pax; + length +--------- + 1048576 +(1 row) + +drop table toasttest_compress_pax; +CREATE TABLE toasttest_extended(f1 text); +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. +-- The storage `EXTENDED` allows both compression and out-of-line storage. +alter table toasttest_extended alter column f1 set storage EXTENDED; +-- about 1M, will use out-of-line storage +INSERT INTO toasttest_extended values (repeat('1234567890123456',1024 * 64)); +-- about 80k , will use compression storage +INSERT INTO toasttest_extended values (repeat('1234567890123456',1024 * 5)); +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty FROM pg_class where relname = 'toasttest_extended'; + is_empty +---------- + f +(1 row) + +create table toasttest_extended_pax(f1 text) using pax; +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'f1' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. 
+insert into toasttest_extended_pax select * from toasttest_extended; +drop table toasttest_extended; +select length(f1) from toasttest_extended_pax; + length +--------- + 1048576 + 81920 +(2 rows) + +drop table toasttest_extended_pax; diff --git a/contrib/pax_storage/src/data/sql/teardown.sql b/contrib/pax_storage/expected/setup.out similarity index 100% rename from contrib/pax_storage/src/data/sql/teardown.sql rename to contrib/pax_storage/expected/setup.out diff --git a/contrib/pax_storage/expected/teardown.out b/contrib/pax_storage/expected/teardown.out new file mode 100644 index 00000000000..e69de29bb2d diff --git a/contrib/pax_storage/src/data/expected/types.out b/contrib/pax_storage/expected/types.out similarity index 75% rename from contrib/pax_storage/src/data/expected/types.out rename to contrib/pax_storage/expected/types.out index 585ea81da8b..3f173f31c0e 100644 --- a/contrib/pax_storage/src/data/expected/types.out +++ b/contrib/pax_storage/expected/types.out @@ -1,8 +1,4 @@ --- start_ignore -create extension pax; -drop table if exists all_typbyval_pg_types; --- end_ignore -CREATE TABLE all_typbyval_pg_types ( +CREATE TABLE pax_test.all_typbyval_pg_types ( id int, bool_col bool, char_col char, @@ -24,10 +20,10 @@ CREATE TABLE all_typbyval_pg_types ( timestamptz_col timestamptz, pg_lsn_col pg_lsn ) USING pax distributed by (id); -insert into all_typbyval_pg_types values(1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), +insert into pax_test.all_typbyval_pg_types values(1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), (1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), (1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 
17:56:49', '16/0'); -select * from all_typbyval_pg_types; +select * from pax_test.all_typbyval_pg_types; id | bool_col | char_col | int2_col | cid_col | float4_col | int4_col | date_col | oid_col | time_stamp_col | int8_col | float8_col | money_col | time_col | timestamptz_col | pg_lsn_col ----+----------+----------+----------+---------+------------+----------+------------+---------+--------------------------+----------+------------+-----------+----------+------------------------------+------------ 1 | t | c | 2 | 0 | 4.2 | 5 | 05-17-2023 | 7 | Wed May 17 17:56:49 2023 | 10 | 11.1111 | $12.00 | 17:56:49 | Wed May 17 17:56:49 2023 PDT | 16/0 @@ -35,10 +31,7 @@ select * from all_typbyval_pg_types; 1 | t | c | 2 | 0 | 4.2 | 5 | 05-17-2023 | 7 | Wed May 17 17:56:49 2023 | 10 | 11.1111 | $12.00 | 17:56:49 | Wed May 17 17:56:49 2023 PDT | 16/0 (3 rows) --- start_ignore -drop table if exists all_typlen_lt_0_pg_type; --- end_ignore -create table all_typlen_lt_0_pg_type ( +create table pax_test.all_typlen_lt_0_pg_type ( id int, name_col name, numeric_col numeric, @@ -46,13 +39,12 @@ create table all_typlen_lt_0_pg_type ( varchar_col varchar(128), point_col point ) USING pax distributed by (id); -insert into all_typlen_lt_0_pg_type values(1,'hello', 1.23, 'text', 'varchar', point(1,2)); -select * from all_typlen_lt_0_pg_type; +insert into pax_test.all_typlen_lt_0_pg_type values(1,'hello', 1.23, 'text', 'varchar', point(1,2)); +select * from pax_test.all_typlen_lt_0_pg_type; id | name_col | numeric_col | text_col | varchar_col | point_col ----+----------+-------------+----------+-------------+----------- 1 | hello | 1.23 | text | varchar | (1,2) (1 row) --- start_ignore -drop table if exists all_typbyval_pg_types; --- end_ignore +drop table pax_test.all_typbyval_pg_types; +drop table pax_test.all_typlen_lt_0_pg_type; diff --git a/contrib/pax_storage/expected/update.out b/contrib/pax_storage/expected/update.out new file mode 100644 index 00000000000..2420012b121 --- /dev/null 
+++ b/contrib/pax_storage/expected/update.out @@ -0,0 +1,624 @@ +set default_table_access_method = pax; +set pax.enable_filter = off; +-- +-- UPDATE ... SET = DEFAULT; +-- +CREATE TABLE update_test ( + a INT DEFAULT 10, + b INT, + c TEXT +); +CREATE TABLE upsert_test ( + a INT PRIMARY KEY, + b TEXT +); +INSERT INTO update_test VALUES (5, 10, 'foo'); +INSERT INTO update_test(b, a) VALUES (15, 10); +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +----+----+----- + 5 | 10 | foo + 10 | 15 | +(2 rows) + +UPDATE update_test SET a = DEFAULT, b = DEFAULT; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +----+---+----- + 10 | | foo + 10 | | +(2 rows) + +-- aliases for the UPDATE target table +UPDATE update_test AS t SET b = 10 WHERE t.a = 10; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +----+----+----- + 10 | 10 | foo + 10 | 10 | +(2 rows) + +UPDATE update_test t SET b = t.b + 10 WHERE t.a = 10; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +----+----+----- + 10 | 20 | foo + 10 | 20 | +(2 rows) + +-- +-- Test VALUES in FROM +-- +UPDATE update_test SET a=v.i FROM (VALUES(100, 20)) AS v(i, j) + WHERE update_test.b = v.j; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +-----+----+----- + 100 | 20 | foo + 100 | 20 | +(2 rows) + +-- fail, wrong data type: +UPDATE update_test SET a = v.* FROM (VALUES(100, 20)) AS v(i, j) + WHERE update_test.b = v.j; +ERROR: column "a" is of type integer but expression is of type record +LINE 1: UPDATE update_test SET a = v.* FROM (VALUES(100, 20)) AS v(i... + ^ +HINT: You will need to rewrite or cast the expression. 
+-- +-- Test multiple-set-clause syntax +-- +INSERT INTO update_test SELECT a,b+1,c FROM update_test; +SELECT * FROM update_test; + a | b | c +-----+----+----- + 100 | 20 | foo + 100 | 20 | + 100 | 21 | foo + 100 | 21 | +(4 rows) + +UPDATE update_test SET (c,b,a) = ('bugle', b+11, DEFAULT) WHERE c = 'foo'; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +-----+----+------- + 10 | 31 | bugle + 10 | 32 | bugle + 100 | 20 | + 100 | 21 | +(4 rows) + +UPDATE update_test SET (c,b) = ('car', a+b), a = a + 1 WHERE a = 10; +SELECT a,b,c FROM update_test ORDER BY a,b,c; + a | b | c +-----+----+----- + 11 | 41 | car + 11 | 42 | car + 100 | 20 | + 100 | 21 | +(4 rows) + +-- fail, multi assignment to same column: +UPDATE update_test SET (c,b) = ('car', a+b), b = a + 1 WHERE a = 10; +ERROR: multiple assignments to same column "b" +-- uncorrelated sub-select: +UPDATE update_test + SET (b,a) = (select a,b from update_test where b = 41 and c = 'car') + WHERE a = 100 AND b = 20; +SELECT * FROM update_test; + a | b | c +-----+----+----- + 100 | 21 | + 11 | 41 | car + 11 | 42 | car + 41 | 11 | +(4 rows) + +-- correlated sub-select: +UPDATE update_test o + SET (b,a) = (select a+1,b from update_test i + where i.a=o.a and i.b=o.b and i.c is not distinct from o.c); +SELECT * FROM update_test; + a | b | c +----+-----+----- + 21 | 101 | + 41 | 12 | car + 42 | 12 | car + 11 | 42 | +(4 rows) + +-- fail, multiple rows supplied: +UPDATE update_test SET (b,a) = (select a+1,b from update_test); +ERROR: more than one row returned by a subquery used as an expression +-- set to null if no rows supplied: +UPDATE update_test SET (b,a) = (select a+1,b from update_test where a = 1000) + WHERE a = 11; +SELECT * FROM update_test; + a | b | c +----+-----+----- + 21 | 101 | + 41 | 12 | car + 42 | 12 | car + | | +(4 rows) + +-- *-expansion should work in this context: +UPDATE update_test SET (a,b) = ROW(v.*) FROM (VALUES(21, 100)) AS v(i, j) + WHERE update_test.a = v.i; +-- you might expect this 
to work, but syntactically it's not a RowExpr: +UPDATE update_test SET (a,b) = (v.*) FROM (VALUES(21, 101)) AS v(i, j) + WHERE update_test.a = v.i; +ERROR: source for a multiple-column UPDATE item must be a sub-SELECT or ROW() expression +LINE 1: UPDATE update_test SET (a,b) = (v.*) FROM (VALUES(21, 101)) ... + ^ +-- if an alias for the target table is specified, don't allow references +-- to the original table name +UPDATE update_test AS t SET b = update_test.b + 10 WHERE t.a = 10; +ERROR: invalid reference to FROM-clause entry for table "update_test" +LINE 1: UPDATE update_test AS t SET b = update_test.b + 10 WHERE t.a... + ^ +HINT: Perhaps you meant to reference the table alias "t". +-- Make sure that we can update to a TOASTed value. +UPDATE update_test SET c = repeat('x', 10000) WHERE c = 'car'; +SELECT a, b, char_length(c) FROM update_test; + a | b | char_length +----+-----+------------- + | | + 21 | 100 | + 41 | 12 | 10000 + 42 | 12 | 10000 +(4 rows) + +-- Check multi-assignment with a Result node to handle a one-time filter. 
+EXPLAIN (VERBOSE, COSTS OFF) +UPDATE update_test t + SET (a, b) = (SELECT b, a FROM update_test s WHERE s.a = t.a) + WHERE CURRENT_USER = SESSION_USER; + QUERY PLAN +---------------------------------------------------------------------------------------------------------- + Update on public.update_test t + -> Explicit Redistribute Motion 3:3 (slice1; segments: 3) + Output: ($1), ($2), t.c, ((SubPlan 1 (returns $1,$2))), t.ctid, t.gp_segment_id, t.*, (DMLAction) + -> Split + Output: ($1), ($2), t.c, ((SubPlan 1 (returns $1,$2))), t.ctid, t.gp_segment_id, t.*, DMLAction + -> Seq Scan on public.update_test t + Output: $1, $2, t.c, (SubPlan 1 (returns $1,$2)), t.ctid, t.gp_segment_id, t.* + SubPlan 1 (returns $1,$2) + -> Result + Output: s.b, s.a + Filter: (s.a = t.a) + -> Materialize + Output: s.b, s.a + -> Broadcast Motion 3:3 (slice2; segments: 3) + Output: s.b, s.a + -> Seq Scan on public.update_test s + Output: s.b, s.a + Optimizer: Postgres query optimizer +(18 rows) + +UPDATE update_test t + SET (a, b) = (SELECT b, a FROM update_test s WHERE s.a = t.a) + WHERE CURRENT_USER = SESSION_USER; +SELECT a, b, char_length(c) FROM update_test; + a | b | char_length +-----+----+------------- + | | + 100 | 21 | + 12 | 41 | 10000 + 12 | 42 | 10000 +(4 rows) + +-- Test ON CONFLICT DO UPDATE +INSERT INTO upsert_test VALUES(1, 'Boo'), (3, 'Zoo'); +-- uncorrelated sub-select: +WITH aaa AS (SELECT 1 AS a, 'Foo' AS b) INSERT INTO upsert_test + VALUES (1, 'Bar') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b, a FROM aaa) RETURNING *; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +-- correlated sub-select: +INSERT INTO upsert_test VALUES (1, 'Baz'), (3, 'Zaz') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Correlated', a from upsert_test i WHERE i.a = upsert_test.a) + RETURNING *; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +-- correlated sub-select (EXCLUDED.* alias): +INSERT INTO upsert_test 
VALUES (1, 'Bat'), (3, 'Zot') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING *; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +-- ON CONFLICT using system attributes in RETURNING, testing both the +-- inserting and updating paths. See bug report at: +-- https://www.postgresql.org/message-id/73436355-6432-49B1-92ED-1FE4F7E7E100%40finefun.com.au +INSERT INTO upsert_test VALUES (2, 'Beeble') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING tableoid::regclass, xmin = pg_current_xact_id()::xid AS xmin_correct, xmax = 0 AS xmax_correct; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +-- currently xmax is set after a conflict - that's probably not good, +-- but it seems worthwhile to have to be explicit if that changes. +INSERT INTO upsert_test VALUES (2, 'Brox') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING tableoid::regclass, xmin = pg_current_xact_id()::xid AS xmin_correct, xmax = pg_current_xact_id()::xid AS xmax_correct; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +DROP TABLE update_test; +DROP TABLE upsert_test; +-- Test ON CONFLICT DO UPDATE with partitioned table and non-identical children +CREATE TABLE upsert_test ( + a INT PRIMARY KEY, + b TEXT +) PARTITION BY LIST (a); +CREATE TABLE upsert_test_1 PARTITION OF upsert_test FOR VALUES IN (1); +CREATE TABLE upsert_test_2 (b TEXT, a INT PRIMARY KEY); +ALTER TABLE upsert_test ATTACH PARTITION upsert_test_2 FOR VALUES IN (2); +INSERT INTO upsert_test VALUES(1, 'Boo'), (2, 'Zoo'); +-- uncorrelated sub-select: +WITH aaa AS (SELECT 1 AS a, 'Foo' AS b) INSERT INTO upsert_test + VALUES (1, 'Bar') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b, a FROM aaa) RETURNING *; +ERROR: 
modification of distribution columns in OnConflictUpdate is not supported +-- correlated sub-select: +WITH aaa AS (SELECT 1 AS ctea, ' Foo' AS cteb) INSERT INTO upsert_test + VALUES (1, 'Bar'), (2, 'Baz') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT upsert_test.b||cteb, upsert_test.a FROM aaa) RETURNING *; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +DROP TABLE upsert_test; +--------------------------- +-- UPDATE with row movement +--------------------------- +-- When a partitioned table receives an UPDATE to the partitioned key and the +-- new values no longer meet the partition's bound, the row must be moved to +-- the correct partition for the new partition key (if one exists). We must +-- also ensure that updatable views on partitioned tables properly enforce any +-- WITH CHECK OPTION that is defined. The situation with triggers in this case +-- also requires thorough testing as partition key updates causing row +-- movement convert UPDATEs into DELETE+INSERT. +CREATE TABLE range_parted ( + a text, + b bigint, + c numeric, + d int, + e varchar +) PARTITION BY RANGE (a, b); +-- Create partitions intentionally in descending bound order, so as to test +-- that update-row-movement works with the leaf partitions not in bound order. +CREATE TABLE part_b_20_b_30 (e varchar, c numeric, a text, b bigint, d int); +-- GPDB: distribution policy must match the parent table. 
+alter table part_b_20_b_30 set distributed by (a); +ALTER TABLE range_parted ATTACH PARTITION part_b_20_b_30 FOR VALUES FROM ('b', 20) TO ('b', 30); +CREATE TABLE part_b_10_b_20 (e varchar, c numeric, a text, b bigint, d int) PARTITION BY RANGE (c); +alter table part_b_10_b_20 set distributed by (a); +CREATE TABLE part_b_1_b_10 PARTITION OF range_parted FOR VALUES FROM ('b', 1) TO ('b', 10); +ALTER TABLE range_parted ATTACH PARTITION part_b_10_b_20 FOR VALUES FROM ('b', 10) TO ('b', 20); +CREATE TABLE part_a_10_a_20 PARTITION OF range_parted FOR VALUES FROM ('a', 10) TO ('a', 20); +CREATE TABLE part_a_1_a_10 PARTITION OF range_parted FOR VALUES FROM ('a', 1) TO ('a', 10); +-- Check that partition-key UPDATE works sanely on a partitioned table that +-- does not have any child partitions. +UPDATE part_b_10_b_20 set b = b - 6; +-- Create some more partitions following the above pattern of descending bound +-- order, but let's make the situation a bit more complex by having the +-- attribute numbers of the columns vary from their parent partition. +CREATE TABLE part_c_100_200 (e varchar, c numeric, a text, b bigint, d int) PARTITION BY range (abs(d)); +ALTER TABLE part_c_100_200 DROP COLUMN e, DROP COLUMN c, DROP COLUMN a; +ALTER TABLE part_c_100_200 ADD COLUMN c numeric, ADD COLUMN e varchar, ADD COLUMN a text; +ALTER TABLE part_c_100_200 DROP COLUMN b; +ALTER TABLE part_c_100_200 ADD COLUMN b bigint; +CREATE TABLE part_d_1_15 PARTITION OF part_c_100_200 FOR VALUES FROM (1) TO (15); +CREATE TABLE part_d_15_20 PARTITION OF part_c_100_200 FOR VALUES FROM (15) TO (20); +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_100_200 FOR VALUES FROM (100) TO (200); +ERROR: distribution policy for "part_c_100_200" must be the same as that for "part_b_10_b_20" +-- GPDB: distribution policy must match the parent table, so the previous command fails. +-- Change the distribution key and try again. 
+alter table part_c_100_200 set distributed by (a); +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_100_200 FOR VALUES FROM (100) TO (200); +CREATE TABLE part_c_1_100 (e varchar, d int, c numeric, b bigint, a text); +alter table part_c_1_100 set distributed by (a); +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_1_100 FOR VALUES FROM (1) TO (100); +\set init_range_parted 'truncate range_parted; insert into range_parted VALUES (''a'', 1, 1, 1), (''a'', 10, 200, 1), (''b'', 12, 96, 1), (''b'', 13, 97, 2), (''b'', 15, 105, 16), (''b'', 17, 105, 19)' +\set show_data 'select tableoid::regclass::text COLLATE "C" partname, * from range_parted ORDER BY 1, 2, 3, 4, 5, 6' +:init_range_parted; +:show_data; + partname | a | b | c | d | e +----------------+---+----+-----+----+--- + part_a_10_a_20 | a | 10 | 200 | 1 | + part_a_1_a_10 | a | 1 | 1 | 1 | + part_c_1_100 | b | 12 | 96 | 1 | + part_c_1_100 | b | 13 | 97 | 2 | + part_d_15_20 | b | 15 | 105 | 16 | + part_d_15_20 | b | 17 | 105 | 19 | +(6 rows) + +-- The order of subplans should be in bound order +EXPLAIN (costs off) UPDATE range_parted set c = c - 50 WHERE c > 97; + QUERY PLAN +------------------------------------------------------- + Update on range_parted + Update on part_a_1_a_10 range_parted_1 + Update on part_a_10_a_20 range_parted_2 + Update on part_b_1_b_10 range_parted_3 + Update on part_c_1_100 range_parted_4 + Update on part_d_1_15 range_parted_5 + Update on part_d_15_20 range_parted_6 + Update on part_b_20_b_30 range_parted_7 + -> Append + -> Seq Scan on part_a_1_a_10 range_parted_1 + Filter: (c > '97'::numeric) + -> Seq Scan on part_a_10_a_20 range_parted_2 + Filter: (c > '97'::numeric) + -> Seq Scan on part_b_1_b_10 range_parted_3 + Filter: (c > '97'::numeric) + -> Seq Scan on part_c_1_100 range_parted_4 + Filter: (c > '97'::numeric) + -> Seq Scan on part_d_1_15 range_parted_5 + Filter: (c > '97'::numeric) + -> Seq Scan on part_d_15_20 range_parted_6 + Filter: (c > '97'::numeric) + -> Seq Scan on 
part_b_20_b_30 range_parted_7 + Filter: (c > '97'::numeric) +(23 rows) + +-- fail, row movement happens only within the partition subtree. +UPDATE part_c_100_200 set c = c - 20, d = c WHERE c = 105; +ERROR: new row for relation "part_c_100_200" violates partition constraint +DETAIL: Failing row contains (105, 85, null, b, 15). +-- fail, no partition key update, so no attempt to move tuple, +-- but "a = 'a'" violates partition constraint enforced by root partition) +UPDATE part_b_10_b_20 set a = 'a'; +ERROR: new row for relation "part_b_10_b_20" violates partition constraint +DETAIL: Failing row contains (null, 96, a, 12, 1). +-- ok, partition key update, no constraint violation +UPDATE range_parted set d = d - 10 WHERE d > 10; +-- ok, no partition key update, no constraint violation +UPDATE range_parted set e = d; +-- No row found +UPDATE part_c_1_100 set c = c + 20 WHERE c = 98; +-- ok, row movement +UPDATE part_b_10_b_20 set c = c + 20 returning c, b, a; + c | b | a +-----+----+--- + 116 | 12 | b + 117 | 13 | b + 125 | 15 | b + 125 | 17 | b +(4 rows) + +:show_data; + partname | a | b | c | d | e +----------------+---+----+-----+---+--- + part_a_10_a_20 | a | 10 | 200 | 1 | 1 + part_a_1_a_10 | a | 1 | 1 | 1 | 1 + part_d_1_15 | b | 12 | 116 | 1 | 1 + part_d_1_15 | b | 13 | 117 | 2 | 2 + part_d_1_15 | b | 15 | 125 | 6 | 6 + part_d_1_15 | b | 17 | 125 | 9 | 9 +(6 rows) + +-- fail, row movement happens only within the partition subtree. +UPDATE part_b_10_b_20 set b = b - 6 WHERE c > 116 returning *; +ERROR: new row for relation "part_b_10_b_20" violates partition constraint +DETAIL: Failing row contains (2, 117, b, 7, 2). +-- ok, row movement, with subset of rows moved into different partition. +UPDATE range_parted set b = b - 6 WHERE c > 116 returning a, b + c; + a | ?column? 
+---+---------- + a | 204 + b | 124 + b | 134 + b | 136 +(4 rows) + +:show_data; + partname | a | b | c | d | e +---------------+---+----+-----+---+--- + part_a_1_a_10 | a | 1 | 1 | 1 | 1 + part_a_1_a_10 | a | 4 | 200 | 1 | 1 + part_b_1_b_10 | b | 7 | 117 | 2 | 2 + part_b_1_b_10 | b | 9 | 125 | 6 | 6 + part_d_1_15 | b | 11 | 125 | 9 | 9 + part_d_1_15 | b | 12 | 116 | 1 | 1 +(6 rows) + +-- Common table needed for multiple test scenarios. +CREATE TABLE mintab(c1 int); +INSERT into mintab VALUES (120); +-- update partition key using updatable view. +CREATE VIEW upview AS SELECT * FROM range_parted WHERE (select c > c1 FROM mintab) WITH CHECK OPTION; +-- ok +UPDATE upview set c = 199 WHERE b = 4; +-- fail, check option violation +UPDATE upview set c = 120 WHERE b = 4; +ERROR: new row violates check option for view "upview" +DETAIL: Failing row contains (a, 4, 120, 1, 1). +-- fail, row movement with check option violation +UPDATE upview set a = 'b', b = 15, c = 120 WHERE b = 4; +ERROR: new row violates check option for view "upview" +DETAIL: Failing row contains (b, 15, 120, 1, 1). +-- ok, row movement, check option passes +UPDATE upview set a = 'b', b = 15 WHERE b = 4; +:show_data; + partname | a | b | c | d | e +---------------+---+----+-----+---+--- + part_a_1_a_10 | a | 1 | 1 | 1 | 1 + part_b_1_b_10 | b | 7 | 117 | 2 | 2 + part_b_1_b_10 | b | 9 | 125 | 6 | 6 + part_d_1_15 | b | 11 | 125 | 9 | 9 + part_d_1_15 | b | 12 | 116 | 1 | 1 + part_d_1_15 | b | 15 | 199 | 1 | 1 +(6 rows) + +-- cleanup +DROP VIEW upview; +-- RETURNING having whole-row vars. 
+:init_range_parted; +UPDATE range_parted set c = 95 WHERE a = 'b' and b > 10 and c > 100 returning (range_parted), *; + range_parted | a | b | c | d | e +---------------+---+----+----+----+--- + (b,15,95,16,) | b | 15 | 95 | 16 | + (b,17,95,19,) | b | 17 | 95 | 19 | +(2 rows) + +:show_data; + partname | a | b | c | d | e +----------------+---+----+-----+----+--- + part_a_10_a_20 | a | 10 | 200 | 1 | + part_a_1_a_10 | a | 1 | 1 | 1 | + part_c_1_100 | b | 12 | 96 | 1 | + part_c_1_100 | b | 13 | 97 | 2 | + part_c_1_100 | b | 15 | 95 | 16 | + part_c_1_100 | b | 17 | 95 | 19 | +(6 rows) + +-- Creating default partition for range +:init_range_parted; +create table part_def partition of range_parted default; +\d+ part_def + Table "public.part_def" + Column | Type | Collation | Nullable | Default | Storage | Stats target | Description +--------+-------------------+-----------+----------+---------+----------+--------------+------------- + a | text | | | | extended | | + b | bigint | | | | plain | | + c | numeric | | | | main | | + d | integer | | | | plain | | + e | character varying | | | | extended | | +Partition of: range_parted DEFAULT +Partition constraint: (NOT ((a IS NOT NULL) AND (b IS NOT NULL) AND (((a = 'a'::text) AND (b >= '1'::bigint) AND (b < '10'::bigint)) OR ((a = 'a'::text) AND (b >= '10'::bigint) AND (b < '20'::bigint)) OR ((a = 'b'::text) AND (b >= '1'::bigint) AND (b < '10'::bigint)) OR ((a = 'b'::text) AND (b >= '10'::bigint) AND (b < '20'::bigint)) OR ((a = 'b'::text) AND (b >= '20'::bigint) AND (b < '30'::bigint))))) + +insert into range_parted values ('c', 9); +-- ok +update part_def set a = 'd' where a = 'c'; +-- fail +update part_def set a = 'a' where a = 'd'; +ERROR: new row for relation "part_def" violates partition constraint +DETAIL: Failing row contains (a, 9, null, null, null). 
+:show_data; + partname | a | b | c | d | e +----------------+---+----+-----+----+--- + part_a_10_a_20 | a | 10 | 200 | 1 | + part_a_1_a_10 | a | 1 | 1 | 1 | + part_c_1_100 | b | 12 | 96 | 1 | + part_c_1_100 | b | 13 | 97 | 2 | + part_d_15_20 | b | 15 | 105 | 16 | + part_d_15_20 | b | 17 | 105 | 19 | + part_def | d | 9 | | | +(7 rows) + +-- Update row movement from non-default to default partition. +-- fail, default partition is not under part_a_10_a_20; +UPDATE part_a_10_a_20 set a = 'ad' WHERE a = 'a'; +ERROR: new row for relation "part_a_10_a_20" violates partition constraint +DETAIL: Failing row contains (ad, 10, 200, 1, null). +-- ok +UPDATE range_parted set a = 'ad' WHERE a = 'a'; +UPDATE range_parted set a = 'bd' WHERE a = 'b'; +:show_data; + partname | a | b | c | d | e +----------+----+----+-----+----+--- + part_def | ad | 1 | 1 | 1 | + part_def | ad | 10 | 200 | 1 | + part_def | bd | 12 | 96 | 1 | + part_def | bd | 13 | 97 | 2 | + part_def | bd | 15 | 105 | 16 | + part_def | bd | 17 | 105 | 19 | + part_def | d | 9 | | | +(7 rows) + +-- Update row movement from default to non-default partitions. +-- ok +UPDATE range_parted set a = 'a' WHERE a = 'ad'; +UPDATE range_parted set a = 'b' WHERE a = 'bd'; +:show_data; + partname | a | b | c | d | e +----------------+---+----+-----+----+--- + part_a_10_a_20 | a | 10 | 200 | 1 | + part_a_1_a_10 | a | 1 | 1 | 1 | + part_c_1_100 | b | 12 | 96 | 1 | + part_c_1_100 | b | 13 | 97 | 2 | + part_d_15_20 | b | 15 | 105 | 16 | + part_d_15_20 | b | 17 | 105 | 19 | + part_def | d | 9 | | | +(7 rows) + +-- Cleanup: range_parted no longer needed. 
+DROP TABLE range_parted; +CREATE TABLE list_parted ( + a text, + b int +) PARTITION BY list (a); +CREATE TABLE list_part1 PARTITION OF list_parted for VALUES in ('a', 'b'); +CREATE TABLE list_default PARTITION OF list_parted default; +INSERT into list_part1 VALUES ('a', 1); +INSERT into list_default VALUES ('d', 10); +-- fail +UPDATE list_default set a = 'a' WHERE a = 'd'; +ERROR: new row for relation "list_default" violates partition constraint +DETAIL: Failing row contains (a, 10). +-- ok +UPDATE list_default set a = 'x' WHERE a = 'd'; +DROP TABLE list_parted; +-------------- +-- Some more update-partition-key test scenarios below. This time use list +-- partitions. +-------------- +-- Setup for list partitions +CREATE TABLE list_parted (a numeric, b int, c int8) PARTITION BY list (a); +CREATE TABLE sub_parted PARTITION OF list_parted for VALUES in (1) PARTITION BY list (b); +CREATE TABLE sub_part1(b int, c int8, a numeric); +alter table sub_part1 set distributed by (a); -- GPDB: distribution policy must match the parent table. +ALTER TABLE sub_parted ATTACH PARTITION sub_part1 for VALUES in (1); +CREATE TABLE sub_part2(b int, c int8, a numeric); +alter table sub_part2 set distributed by (a); -- GPDB: distribution policy must match the parent table. +ALTER TABLE sub_parted ATTACH PARTITION sub_part2 for VALUES in (2); +CREATE TABLE list_part1(a numeric, b int, c int8); +ALTER TABLE list_parted ATTACH PARTITION list_part1 for VALUES in (2,3); +INSERT into list_parted VALUES (2,5,50); +INSERT into list_parted VALUES (3,6,60); +INSERT into sub_parted VALUES (1,1,60); +INSERT into sub_parted VALUES (1,2,10); +-- Test partition constraint violation when intermediate ancestor is used and +-- constraint is inherited from upper root. +UPDATE sub_parted set a = 2 WHERE c = 10; +ERROR: new row for relation "sub_parted" violates partition constraint +DETAIL: Failing row contains (2, 2, 10). 
+-- Test update-partition-key, where the unpruned partitions do not have their +-- partition keys updated. +SELECT tableoid::regclass::text, * FROM list_parted WHERE a = 2 ORDER BY 1; + tableoid | a | b | c +------------+---+---+---- + list_part1 | 2 | 5 | 50 +(1 row) + +UPDATE list_parted set b = c + a WHERE a = 2; +SELECT tableoid::regclass::text, * FROM list_parted WHERE a = 2 ORDER BY 1; + tableoid | a | b | c +------------+---+----+---- + list_part1 | 2 | 52 | 50 +(1 row) + +-- Cleanup: list_parted no longer needed. +DROP TABLE list_parted; +-- create custom operator class and hash function, for the same reason +-- explained in alter_table.sql +create or replace function dummy_hashint4(a int4, seed int8) returns int8 as +$$ begin return (a + seed); end; $$ language 'plpgsql' immutable; +create operator class custom_opclass for type int4 using hash as +operator 1 = , function 2 dummy_hashint4(int4, int8); +create table hash_parted ( + a int, + b int +) partition by hash (a custom_opclass, b custom_opclass); +create table hpart1 partition of hash_parted for values with (modulus 2, remainder 1); +create table hpart2 partition of hash_parted for values with (modulus 4, remainder 2); +create table hpart3 partition of hash_parted for values with (modulus 8, remainder 0); +create table hpart4 partition of hash_parted for values with (modulus 8, remainder 4); +insert into hpart1 values (1, 1); +insert into hpart2 values (2, 5); +insert into hpart4 values (3, 4); +-- fail +update hpart1 set a = 3, b=4 where a = 1; +ERROR: new row for relation "hpart1" violates partition constraint +DETAIL: Failing row contains (3, 4). 
+-- ok, row movement +update hash_parted set b = b - 1 where b = 1; +-- ok +update hash_parted set b = b + 8 where b = 1; +-- cleanup +drop table hash_parted; +drop operator class custom_opclass using hash; +drop function dummy_hashint4(a int4, seed int8); diff --git a/contrib/pax_storage/src/data/expected/update_gp.out b/contrib/pax_storage/expected/update_gp.out similarity index 77% rename from contrib/pax_storage/src/data/expected/update_gp.out rename to contrib/pax_storage/expected/update_gp.out index ba6ca2bc930..9a06ce92d04 100644 --- a/contrib/pax_storage/src/data/expected/update_gp.out +++ b/contrib/pax_storage/expected/update_gp.out @@ -1,9 +1,9 @@ +set default_table_access_method = pax; -- Test DELETE and UPDATE on an inherited table. -- The special aspect of this table is that the inherited table has -- a different distribution key. 'p' table's distribution key matches -- that of 'r', but 'p2's doesn't. Test that the planner adds a Motion -- node correctly for p2. -set default_table_access_method = 'pax'; create table todelete (a int) distributed by (a); create table parent (a int, b int, c int) distributed by (a); create table child (a int, b int, c int) inherits (parent) distributed by (b); @@ -19,14 +19,14 @@ update parent set c=c+100 from todelete where parent.a = todelete.a; select * from parent; a | b | c ----+----+----- + 1 | 1 | 1 5 | 5 | 105 9 | 9 | 9 - 10 | 10 | 10 - 6 | 6 | 106 + 7 | 7 | 107 2 | 2 | 2 8 | 8 | 8 - 7 | 7 | 107 - 1 | 1 | 1 + 10 | 10 | 10 + 6 | 6 | 106 (8 rows) drop table todelete; @@ -49,13 +49,13 @@ update target set b=target.b+100 where c = 3 and a in (select b from todelete); select * from target; a | b | c ---+-----+--- - 5 | 0 | 1 - 5 | 100 | 3 - 1 | 0 | 1 2 | 0 | 1 - 3 | 0 | 1 4 | 0 | 1 4 | 0 | 3 + 1 | 0 | 1 + 3 | 0 | 1 + 5 | 0 | 1 + 5 | 100 | 3 (7 rows) -- Also test an update with a qual that doesn't match any partition. 
The @@ -76,12 +76,10 @@ create table child_b (a int4, b int4) inherits (base_tbl) distributed by (b); NOTICE: merging column "a" with inherited definition NOTICE: merging column "b" with inherited definition insert into base_tbl select g, g from generate_series(1, 5) g; --- start_ignore explain (costs off) update base_tbl set a=a+1; -ERROR: can't split update for inherit table: base_tbl (preptlist.c:138) --- end_ignore +ERROR: can't split update for inherit table: base_tbl update base_tbl set a = 5; -ERROR: can't split update for inherit table: base_tbl (preptlist.c:138) +ERROR: can't split update for inherit table: base_tbl -- -- Explicit Distribution motion must be added if any of the child nodes -- contains any motion excluding the motions in initplans. @@ -96,8 +94,8 @@ CREATE TABLE keo3 ( sky_per character varying(24), bky_per character varying(24) INSERT INTO keo3 VALUES ('1', '1'); CREATE TABLE keo4 ( keo_para_required_period character varying(6), keo_para_budget_date character varying(24)) DISTRIBUTED RANDOMLY; INSERT INTO keo4 VALUES ('1', '1'); +ANALYZE keo1, keo2, keo3, keo4; -- Explicit Redistribution motion should be added in case of GPDB Planner (test case not applicable for ORCA) --- start_ignore EXPLAIN (COSTS OFF) UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b ON b.projects_pk=a.user_vie_project_code_pk @@ -107,41 +105,37 @@ EXPLAIN (COSTS OFF) UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM (SELECT min (keo4.keo_para_budget_date) FROM keo4))) ) t1 WHERE t1.user_vie_project_code_pk = keo1.user_vie_project_code_pk; - QUERY PLAN -------------------------------------------------------------------------------------------------------------------------- + QUERY PLAN +------------------------------------------------------------------------------------------------------- Update on keo1 - InitPlan 3 (returns $2) (slice4) - -> Finalize Aggregate - InitPlan 2 (returns $1) 
(slice6) - -> Gather Motion 3:1 (slice7; segments: 3) - InitPlan 1 (returns $0) (slice8) - -> Finalize Aggregate - -> Gather Motion 3:1 (slice9; segments: 3) - -> Partial Aggregate - -> Seq Scan on keo4 + InitPlan 3 (returns $2) (slice3) + -> Aggregate + InitPlan 2 (returns $1) (slice5) + -> Gather Motion 3:1 (slice6; segments: 3) + InitPlan 1 (returns $0) (slice7) + -> Aggregate + -> Gather Motion 3:1 (slice8; segments: 3) + -> Seq Scan on keo4 -> Seq Scan on keo4 keo4_1 Filter: ((keo_para_budget_date)::text = $0) - -> Gather Motion 3:1 (slice5; segments: 3) - -> Partial Aggregate - -> Seq Scan on keo3 - Filter: ((bky_per)::text = ($1)::text) - -> Explicit Redistribute Motion 3:3 (slice1; segments: 3) + -> Gather Motion 3:1 (slice4; segments: 3) + -> Seq Scan on keo3 + Filter: ((bky_per)::text = ($1)::text) + -> Hash Join + Hash Cond: ((a.user_vie_project_code_pk)::text = (b.projects_pk)::text) -> Hash Join - Hash Cond: ((b.projects_pk)::text = (a.user_vie_project_code_pk)::text) - -> Seq Scan on keo2 b + Hash Cond: ((a.user_vie_project_code_pk)::text = (keo1.user_vie_project_code_pk)::text) + -> Broadcast Motion 3:3 (slice1; segments: 3) + -> Seq Scan on keo1 a + Filter: ((user_vie_fiscal_year_period_sk)::text = $2) -> Hash - -> Broadcast Motion 3:3 (slice2; segments: 3) - -> Hash Join - Hash Cond: ((keo1.user_vie_project_code_pk)::text = (a.user_vie_project_code_pk)::text) - -> Seq Scan on keo1 - -> Hash - -> Broadcast Motion 3:3 (slice3; segments: 3) - -> Seq Scan on keo1 a - Filter: ((user_vie_fiscal_year_period_sk)::text = $2) + -> Seq Scan on keo1 + -> Hash + -> Broadcast Motion 3:3 (slice2; segments: 3) + -> Seq Scan on keo2 b Optimizer: Postgres query optimizer -(30 rows) +(27 rows) --- end_ignore UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b ON b.projects_pk=a.user_vie_project_code_pk @@ -160,7 +154,6 @@ SELECT user_vie_act_cntr_marg_cum FROM keo1; -- Explicit Redistribution 
motion should not be added in case of GPDB Planner (test case not applicable to ORCA) CREATE TABLE keo5 (x int, y int) DISTRIBUTED BY (x); INSERT INTO keo5 VALUES (1,1); --- start_ignore EXPLAIN (COSTS OFF) DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 WHERE x < 2)); QUERY PLAN ------------------------------------------------------- @@ -181,7 +174,6 @@ EXPLAIN (COSTS OFF) DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS Optimizer: Postgres query optimizer (15 rows) --- end_ignore DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 WHERE x < 2)); SELECT x FROM keo5; x @@ -194,34 +186,48 @@ DROP TABLE keo2; DROP TABLE keo3; DROP TABLE keo4; DROP TABLE keo5; --- start_ignore --- -- text types. We should support the following updates. --- -- --- CREATE TEMP TABLE ttab1 (a varchar(15), b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a varchar(15), b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a text, b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a text, b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a varchar, b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a varchar, b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a char(15), b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a char(15), b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE IF EXISTS update_distr_key; --- CREATE TEMP TABLE update_distr_key (a int, b int) DISTRIBUTED BY (a); --- INSERT INTO update_distr_key select i, i* 10 from generate_series(0, 9) i; 
--- UPDATE update_distr_key SET a = 5 WHERE b = 10; --- SELECT * from update_distr_key; --- DROP TABLE update_distr_key; --- end_ignore +-- +-- text types. We should support the following updates. +-- +CREATE TEMP TABLE ttab1 (a varchar(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar(15), b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a text, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a text, b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a varchar, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar, b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a char(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a char(15), b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE IF EXISTS update_distr_key; +NOTICE: table "update_distr_key" does not exist, skipping +CREATE TEMP TABLE update_distr_key (a int, b int) DISTRIBUTED BY (a); +INSERT INTO update_distr_key select i, i* 10 from generate_series(0, 9) i; +UPDATE update_distr_key SET a = 5 WHERE b = 10; +SELECT * from update_distr_key; + a | b +---+---- + 0 | 0 + 2 | 20 + 4 | 40 + 6 | 60 + 8 | 80 + 5 | 10 + 3 | 30 + 5 | 50 + 7 | 70 + 9 | 90 +(10 rows) + +DROP TABLE update_distr_key; -- below cases is to test multi-hash-cols CREATE TABLE tab3(c1 int, c2 int, c3 int, c4 int, c5 int) DISTRIBUTED BY (c1, c2, c3); CREATE TABLE tab5(c1 int, c2 int, c3 int, c4 int, c5 int) DISTRIBUTED BY (c1, c2, c3, c4, c5); @@ -233,14 +239,14 @@ SELECT gp_segment_id, * FROM tab3; ---------------+----+----+----+----+---- 0 | 5 | 5 | 5 | 5 | 5 0 | 8 | 8 | 8 | 8 | 8 - 2 | 1 | 1 | 1 | 1 | 1 - 2 
| 2 | 2 | 2 | 2 | 2 - 2 | 6 | 6 | 6 | 6 | 6 - 2 | 7 | 7 | 7 | 7 | 7 1 | 3 | 3 | 3 | 3 | 3 1 | 4 | 4 | 4 | 4 | 4 1 | 9 | 9 | 9 | 9 | 9 1 | 10 | 10 | 10 | 10 | 10 + 2 | 1 | 1 | 1 | 1 | 1 + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 (10 rows) UPDATE tab3 set c1 = 9 where c4 = 1; @@ -267,66 +273,69 @@ SELECT gp_segment_id, * FROM tab3; 1 | 4 | 4 | 4 | 4 | 4 1 | 9 | 9 | 9 | 9 | 9 1 | 10 | 10 | 10 | 10 | 10 + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 2 | 2 | 2 | 2 | 2 | 2 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 5 | 6 | 1 | 1 | 1 - 0 | 5 | 5 | 5 | 5 | 5 - 0 | 8 | 8 | 8 | 8 | 8 (10 rows) UPDATE tab3 set (c1,c2,c3) = (3,2,1) where c4 = 1; SELECT gp_segment_id, * FROM tab3; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- - 0 | 5 | 5 | 5 | 5 | 5 - 0 | 8 | 8 | 8 | 8 | 8 - 1 | 3 | 3 | 3 | 3 | 3 - 1 | 4 | 4 | 4 | 4 | 4 - 1 | 9 | 9 | 9 | 9 | 9 - 1 | 10 | 10 | 10 | 10 | 10 2 | 2 | 2 | 2 | 2 | 2 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 3 | 2 | 1 | 1 | 1 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 (10 rows) UPDATE tab3 set c1 = 11 where c2 = 10 and c2 < 1; SELECT gp_segment_id, * FROM tab3; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- - 1 | 3 | 3 | 3 | 3 | 3 - 1 | 4 | 4 | 4 | 4 | 4 - 1 | 9 | 9 | 9 | 9 | 9 - 1 | 10 | 10 | 10 | 10 | 10 0 | 5 | 5 | 5 | 5 | 5 0 | 8 | 8 | 8 | 8 | 8 2 | 2 | 2 | 2 | 2 | 2 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 3 | 2 | 1 | 1 | 1 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 (10 rows) -- test tab5 SELECT gp_segment_id, * FROM tab5; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- - 0 | 4 | 4 | 4 | 4 | 4 - 0 | 9 | 9 | 9 | 9 | 9 - 0 | 10 | 10 | 10 | 10 | 10 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 1 | 1 | 1 | 1 | 1 | 1 1 | 
2 | 2 | 2 | 2 | 2 1 | 3 | 3 | 3 | 3 | 3 1 | 5 | 5 | 5 | 5 | 5 - 2 | 6 | 6 | 6 | 6 | 6 - 2 | 7 | 7 | 7 | 7 | 7 - 2 | 8 | 8 | 8 | 8 | 8 + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 (10 rows) UPDATE tab5 set c1 = 1000 where c4 = 1; SELECT gp_segment_id, * FROM tab5; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+------+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 1 | 2 | 2 | 2 | 2 | 2 1 | 3 | 3 | 3 | 3 | 3 1 | 5 | 5 | 5 | 5 | 5 @@ -334,9 +343,6 @@ SELECT gp_segment_id, * FROM tab5; 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 8 | 8 | 8 | 8 | 8 - 0 | 4 | 4 | 4 | 4 | 4 - 0 | 9 | 9 | 9 | 9 | 9 - 0 | 10 | 10 | 10 | 10 | 10 (10 rows) UPDATE tab5 set (c1,c2) = (9,10) where c4 = 1; @@ -359,12 +365,12 @@ UPDATE tab5 set (c1,c2,c4) = (5,8,6) where c4 = 1; SELECT gp_segment_id, * FROM tab5; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- - 2 | 6 | 6 | 6 | 6 | 6 - 2 | 7 | 7 | 7 | 7 | 7 - 2 | 8 | 8 | 8 | 8 | 8 1 | 2 | 2 | 2 | 2 | 2 1 | 3 | 3 | 3 | 3 | 3 1 | 5 | 5 | 5 | 5 | 5 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 0 | 4 | 4 | 4 | 4 | 4 0 | 9 | 9 | 9 | 9 | 9 0 | 10 | 10 | 10 | 10 | 10 @@ -375,6 +381,9 @@ UPDATE tab5 set (c1,c2,c3,c4,c5) = (1,2,3,0,6) where c5 = 1; SELECT gp_segment_id, * FROM tab5; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 1 | 2 | 2 | 2 | 2 | 2 1 | 3 | 3 | 3 | 3 | 3 1 | 5 | 5 | 5 | 5 | 5 @@ -382,15 +391,15 @@ SELECT gp_segment_id, * FROM tab5; 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 8 | 8 | 8 | 8 | 8 - 0 | 4 | 4 | 4 | 4 | 4 - 0 | 9 | 9 | 9 | 9 | 9 - 0 | 10 | 10 | 10 | 10 | 10 (10 rows) UPDATE tab5 set c1 = 11 where c3 = 10 and c3 < 1; SELECT gp_segment_id, * FROM tab5; gp_segment_id | c1 | c2 | c3 | c4 | c5 ---------------+----+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 
| 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 1 | 2 | 2 | 2 | 2 | 2 1 | 3 | 3 | 3 | 3 | 3 1 | 5 | 5 | 5 | 5 | 5 @@ -398,12 +407,8 @@ SELECT gp_segment_id, * FROM tab5; 2 | 6 | 6 | 6 | 6 | 6 2 | 7 | 7 | 7 | 7 | 7 2 | 8 | 8 | 8 | 8 | 8 - 0 | 4 | 4 | 4 | 4 | 4 - 0 | 9 | 9 | 9 | 9 | 9 - 0 | 10 | 10 | 10 | 10 | 10 (10 rows) --- start_ignore EXPLAIN (COSTS OFF ) UPDATE tab3 SET C1 = C1 + 1, C5 = C5+1; QUERY PLAN --------------------------------------------------------------- @@ -414,7 +419,6 @@ EXPLAIN (COSTS OFF ) UPDATE tab3 SET C1 = C1 + 1, C5 = C5+1; Optimizer: Postgres query optimizer (5 rows) --- end_ignore -- clean up drop table tab3; drop table tab5; @@ -430,6 +434,12 @@ drop table if exists update_ao_table; NOTICE: table "update_ao_table" does not exist, skipping drop table if exists update_aoco_table; NOTICE: table "update_aoco_table" does not exist, skipping +drop table if exists p_1; +NOTICE: table "p_1" does not exist, skipping +drop table if exists p_2; +NOTICE: table "p_2" does not exist, skipping +drop table if exists subpartition_1; +NOTICE: table "subpartition_1" does not exist, skipping -- end_ignore -- Update normal table distribution key create table update_dist(a int) distributed by (a); @@ -449,43 +459,43 @@ insert into s select generate_series(1, 5), generate_series(1, 5) * 2; select * from r; a | b ---+---- - 1 | 2 - 5 | 10 - 2 | 4 3 | 6 4 | 8 + 5 | 10 + 1 | 2 + 2 | 4 (5 rows) select * from s; a | b ---+---- + 1 | 2 2 | 4 3 | 6 4 | 8 5 | 10 - 1 | 2 (5 rows) update r set a = r.a + 1 from s where r.a = s.a; select * from r; a | b ---+---- - 3 | 4 4 | 6 - 2 | 2 5 | 8 6 | 10 + 3 | 4 + 2 | 2 (5 rows) update r set a = r.a + 1 where a in (select a from s); select * from r; a | b ---+---- - 4 | 4 - 3 | 2 6 | 10 5 | 6 6 | 8 + 4 | 4 + 3 | 2 (5 rows) -- Update redistribution @@ -496,32 +506,32 @@ insert into s select generate_series(1, 5), generate_series(1, 5) * 2; select * from r; a | b ---+--- + 3 | 3 + 4 | 4 5 | 5 1 | 1 2 | 2 - 3 | 3 - 4 | 4 (5 rows) select * 
from s; a | b ---+---- - 1 | 2 - 5 | 10 - 2 | 4 3 | 6 4 | 8 + 5 | 10 + 1 | 2 + 2 | 4 (5 rows) update r set a = r.a + 1 from s where r.b = s.b; select * from r; a | b ---+--- - 3 | 3 - 3 | 2 1 | 1 + 3 | 3 5 | 5 5 | 4 + 3 | 2 (5 rows) update r set a = r.a + 1 where b in (select b from s); @@ -529,9 +539,9 @@ select * from r; a | b ---+--- 1 | 1 + 3 | 3 5 | 5 6 | 4 - 3 | 3 4 | 2 (5 rows) @@ -553,48 +563,82 @@ select * from r; select * from s; a | b ---+--- - 2 | 2 3 | 3 4 | 4 - 1 | 1 5 | 5 + 1 | 1 + 2 | 2 (5 rows) update s set a = s.a + 1 where exists (select 1 from r where s.a = r.b); select * from s; a | b ---+--- - 5 | 5 - 5 | 4 1 | 1 3 | 3 + 5 | 5 3 | 2 + 5 | 4 (5 rows) --- start_ignore -- Update ao table distribution key --- create table update_ao_table (a int, b int) WITH (appendonly=true) distributed by (a); --- insert into update_ao_table select g, g from generate_series(1, 5) g; --- select * from update_ao_table; --- update update_ao_table set a = a + 1 where b = 3; --- select * from update_ao_table; +create table update_ao_table (a int, b int) WITH (appendonly=true) distributed by (a); +insert into update_ao_table select g, g from generate_series(1, 5) g; +select * from update_ao_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 3 | 3 + 4 | 4 + 5 | 5 +(5 rows) + +update update_ao_table set a = a + 1 where b = 3; +select * from update_ao_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 4 | 4 + 5 | 5 + 4 | 3 +(5 rows) + -- Update aoco table distribution key --- create table update_aoco_table (a int, b int) WITH (appendonly=true, orientation=column) distributed by (a); --- insert into update_aoco_table select g,g from generate_series(1, 5) g; --- select * from update_aoco_table; --- update update_aoco_table set a = a + 1 where b = 3; --- select * from update_aoco_table; --- end_ignore +create table update_aoco_table (a int, b int) WITH (appendonly=true, orientation=column) distributed by (a); +insert into update_aoco_table select g,g from generate_series(1, 5) g; +select * 
from update_aoco_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 3 | 3 + 4 | 4 + 5 | 5 +(5 rows) + +update update_aoco_table set a = a + 1 where b = 3; +select * from update_aoco_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 4 | 4 + 5 | 5 + 4 | 3 +(5 rows) + -- Update prepare delete from s; insert into s select generate_series(1, 5), generate_series(1, 5); select * from r; a | b ---+---- + 1 | 2 2 | 4 3 | 6 4 | 8 - 1 | 2 5 | 10 (5 rows) @@ -602,10 +646,10 @@ select * from s; a | b ---+--- 1 | 1 - 5 | 5 2 | 2 3 | 3 4 | 4 + 5 | 5 (5 rows) prepare update_s(int) as update s set a = s.a + $1 where exists (select 1 from r where s.a = r.b); @@ -613,27 +657,26 @@ execute update_s(10); select * from s; a | b ----+--- - 3 | 3 1 | 1 - 12 | 2 - 5 | 5 14 | 4 + 3 | 3 + 5 | 5 + 12 | 2 (5 rows) -- Confirm that a split update is not created for a table excluded by -- constraints in the planner. create table nosplitupdate (a int) distributed by (a); --- start_ignore explain update nosplitupdate set a=0 where a=1 and a<1; QUERY PLAN ----------------------------------------------------------- - Update on nosplitupdate (cost=0.00..0.01 rows=0 width=0) - -> Result (cost=0.00..0.00 rows=0 width=46) + Update on nosplitupdate (cost=0.00..0.01 rows=1 width=0) + -> Result (cost=0.00..0.01 rows=1 width=0) One-Time Filter: false + Planning time: 0.271 ms Optimizer: Postgres query optimizer -(4 rows) +(5 rows) --- end_ignore -- test split-update when split-node's flow is entry create table tsplit_entry (c int); NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c' as the Cloudberry Database data distribution key for this table. @@ -641,53 +684,56 @@ HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. 
Make sur insert into tsplit_entry values (1), (2); analyze tsplit_entry; -- start_ignore +-- gp_segment_configuration scan is different when using different FTS explain update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; QUERY PLAN ------------------------------------------------------------------------------------------------------------------ - Update on tsplit_entry (cost=10000000001.01..10000000002.17 rows=0 width=0) - -> Explicit Redistribute Motion 1:3 (slice1) (cost=10000000001.01..10000000002.17 rows=2 width=74) - -> Split (cost=10000000001.01..10000000002.08 rows=7 width=74) - -> Nested Loop (cost=10000000001.01..10000000002.08 rows=3 width=74) - -> Gather Motion 3:1 (slice2; segments: 3) (cost=0.00..1.03 rows=1 width=38) - -> Seq Scan on tsplit_entry (cost=0.00..1.01 rows=1 width=38) - -> Materialize (cost=1.01..1.04 rows=1 width=40) - -> Subquery Scan on s (cost=1.01..1.03 rows=1 width=40) - -> Aggregate (cost=1.01..1.02 rows=1 width=8) - -> Seq Scan on gp_segment_configuration (cost=0.00..1.01 rows=1 width=0) + Update on tsplit_entry (cost=10000000001.00..10000000003.18 rows=3 width=54) + -> Explicit Redistribute Motion 1:3 (slice) (cost=10000000001.00..10000000003.18 rows=7 width=54) + -> Split (cost=10000000001.00..10000000003.18 rows=7 width=54) + -> Nested Loop (cost=10000000001.00..10000000003.12 rows=4 width=54) + -> Gather Motion 3:1 (slice2; segments: 3) (cost=0.00..2.06 rows=2 width=14) + -> Seq Scan on tsplit_entry (cost=0.00..2.02 rows=1 width=14) + -> Materialize (cost=1.00..1.03 rows=1 width=40) + -> Subquery Scan on s (cost=1.00..1.02 rows=1 width=40) + -> Aggregate (cost=1.00..1.01 rows=1 width=8) + -> Function Scan on gp_get_segment_configuration (cost=0.00..1.00 rows=1 width=0) Optimizer: Postgres query optimizer (11 rows) - -- end_ignore update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; --- start_ignore --- CREATE TABLE update_gp_foo ( --- a_dist int, 
--- b int, --- c_part int, --- d int --- ) --- WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) --- ( --- PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo_1_prt_p20190305', appendonly=false) --- ); --- CREATE TABLE update_gp_foo1 ( --- a_dist int, --- b int, --- c_part int, --- d int --- ) --- WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) --- ( --- PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo1_1_prt_p20190305', appendonly=false) --- ); --- INSERT INTO update_gp_foo VALUES (12, 40, 1, 50); --- INSERT INTO update_gp_foo1 VALUES (12, 3, 1, 50); --- UPDATE update_gp_foo --- SET b = update_gp_foo.c_part, --- d = update_gp_foo1.a_dist --- FROM update_gp_foo1; --- SELECT * from update_gp_foo; --- end_ignore +CREATE TABLE update_gp_foo ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo_1_prt_p20190305', appendonly=false) + ); +CREATE TABLE update_gp_foo1 ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo1_1_prt_p20190305', appendonly=false) + ); +INSERT INTO update_gp_foo VALUES (12, 40, 1, 50); +INSERT INTO update_gp_foo1 VALUES (12, 3, 1, 50); +UPDATE update_gp_foo +SET b = update_gp_foo.c_part, + d = update_gp_foo1.a_dist +FROM update_gp_foo1; +SELECT * from update_gp_foo; + a_dist | b | c_part | d +--------+---+--------+---- + 12 | 1 | 1 | 12 +(1 row) + -- Test insert on conflict do update -- Insert on conflict do update is an insert statement but might -- invoke ExecUpdate on segments, but updating distkeys of a table @@ -695,31 +741,24 @@ update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_confi -- planning, if a `insert on conflict do update` statement 
set the -- dist keys of the table, it will raise an error. -- See github issue: https://github.com/greenplum-db/gpdb/issues/9444 --- start_ignore create table t_insert_on_conflict_update_distkey(a int, b int) distributed by (a); create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); -ERROR: not supported on pax relations: IndexBuildRangeScan -- the following statement should error out because the on conflict update want to -- modify the tuple's distkey which might lead to wrong data distribution insert into t_insert_on_conflict_update_distkey values (1, 1) on conflict(a, b) do update set a = 1; ERROR: modification of distribution columns in OnConflictUpdate is not supported drop index uidx_t_insert_on_conflict_update_distkey; -ERROR: index "uidx_t_insert_on_conflict_update_distkey" does not exist drop table t_insert_on_conflict_update_distkey; -- randomly distributed table cannot add unique constrain, so next we test replicated table create table t_insert_on_conflict_update_distkey(a int, b int) distributed replicated; create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); -ERROR: not supported on pax relations: IndexBuildRangeScan -- the following statement should succeed because replicated table does not contain distkey insert into t_insert_on_conflict_update_distkey values (1, 1) on conflict(a, b) do update set a = 1; -ERROR: there is no unique or exclusion constraint matching the ON CONFLICT specification --- end_ignore +ERROR: not implemented yet on pax relations: TupleInsertSpeculative -- Some tests on a partitioned table. 
CREATE TABLE update_gp_rangep (a int, b int, orig_a int) DISTRIBUTED BY (b) PARTITION BY RANGE (a); CREATE TABLE update_gp_rangep_1_to_10 PARTITION OF update_gp_rangep FOR VALUES FROM (1) TO (10); -NOTICE: table has parent, setting distribution columns to match parent table CREATE TABLE update_gp_rangep_10_to_20 PARTITION OF update_gp_rangep FOR VALUES FROM (10) TO (20); -NOTICE: table has parent, setting distribution columns to match parent table INSERT INTO update_gp_rangep SELECT g, g, g FROM generate_series(1, 4) g; -- Simple case: Same partition, same node. UPDATE update_gp_rangep SET a = 9 WHERE a = 1; @@ -729,24 +768,23 @@ UPDATE update_gp_rangep SET b = 1 WHERE a = 2; UPDATE update_gp_rangep SET a = 10 WHERE a = 3; -- Move row to different partition and also change distribution key UPDATE update_gp_rangep SET a = 11, b = 1 WHERE a = 4; --- start_ignore SELECT tableoid::regclass, * FROM update_gp_rangep ORDER BY orig_a; tableoid | a | b | orig_a ---------------------------+----+---+-------- update_gp_rangep_1_to_10 | 9 | 1 | 1 update_gp_rangep_1_to_10 | 2 | 1 | 2 + update_gp_rangep_10_to_20 | 10 | 3 | 3 update_gp_rangep_10_to_20 | 11 | 1 | 4 -(3 rows) +(4 rows) --- end_ignore -- Also do a lookup with specific distribution key. If the rows were not -- correctly moved across segments, this would fail to find them, assuming -- that direct dispatch is effective. 
SELECT tableoid::regclass, * FROM update_gp_rangep WHERE b = 1; tableoid | a | b | orig_a ---------------------------+----+---+-------- - update_gp_rangep_1_to_10 | 9 | 1 | 1 update_gp_rangep_1_to_10 | 2 | 1 | 2 + update_gp_rangep_1_to_10 | 9 | 1 | 1 update_gp_rangep_10_to_20 | 11 | 1 | 4 (3 rows) @@ -755,9 +793,7 @@ drop table r; drop table s; drop table update_dist; drop table update_ao_table; -ERROR: table "update_ao_table" does not exist drop table update_aoco_table; -ERROR: table "update_aoco_table" does not exist drop table nosplitupdate; drop table tsplit_entry; -- end_ignore diff --git a/contrib/pax_storage/expected/update_gp_optimizer.out b/contrib/pax_storage/expected/update_gp_optimizer.out new file mode 100644 index 00000000000..d335f4c3f61 --- /dev/null +++ b/contrib/pax_storage/expected/update_gp_optimizer.out @@ -0,0 +1,793 @@ +set default_table_access_method = pax; +-- Test DELETE and UPDATE on an inherited table. +-- The special aspect of this table is that the inherited table has +-- a different distribution key. 'p' table's distribution key matches +-- that of 'r', but 'p2's doesn't. Test that the planner adds a Motion +-- node correctly for p2. 
+create table todelete (a int) distributed by (a); +create table parent (a int, b int, c int) distributed by (a); +create table child (a int, b int, c int) inherits (parent) distributed by (b); +NOTICE: merging column "a" with inherited definition +NOTICE: merging column "b" with inherited definition +NOTICE: merging column "c" with inherited definition +insert into parent select g, g, g from generate_series(1,5) g; +insert into child select g, g, g from generate_series(6,10) g; +insert into todelete select generate_series(3,4); +delete from parent using todelete where parent.a = todelete.a; +insert into todelete select generate_series(5,7); +update parent set c=c+100 from todelete where parent.a = todelete.a; +select * from parent; + a | b | c +----+----+----- + 1 | 1 | 1 + 5 | 5 | 105 + 9 | 9 | 9 + 7 | 7 | 107 + 2 | 2 | 2 + 8 | 8 | 8 + 10 | 10 | 10 + 6 | 6 | 106 +(8 rows) + +drop table todelete; +drop table child; +drop table parent; +-- This is similar to the above, but with a partitioned table (which is +-- implemented by inheritance) rather than an explicitly inherited table. +-- The scans on some of the partitions degenerate into Result nodes with +-- False one-time filter, which don't need a Motion node. 
+create table todelete (a int, b int) distributed by (a); +create table target (a int, b int, c int) + distributed by (a) + partition by range (c) (start(1) end(5) every(1), default partition extra); +insert into todelete select g, g % 4 from generate_series(1, 10) g; +insert into target select g, 0, 3 from generate_series(1, 5) g; +insert into target select g, 0, 1 from generate_series(1, 5) g; +delete from target where c = 3 and a in (select b from todelete); +insert into todelete values (1, 5); +update target set b=target.b+100 where c = 3 and a in (select b from todelete); +select * from target; + a | b | c +---+-----+--- + 2 | 0 | 1 + 4 | 0 | 1 + 4 | 0 | 3 + 1 | 0 | 1 + 3 | 0 | 1 + 5 | 0 | 1 + 5 | 100 | 3 +(7 rows) + +-- Also test an update with a qual that doesn't match any partition. The +-- Append degenerates into a dummy Result with false One-Time Filter. +alter table target drop default partition; +update target set b = 10 where c = 10; +drop table todelete; +drop table target; +-- +-- Test updated on inheritance parent table, where some child tables need a +-- Split Update, but not all. +-- +create table base_tbl (a int4, b int4) distributed by (a); +create table child_a (a int4, b int4) inherits (base_tbl) distributed by (a); +NOTICE: merging column "a" with inherited definition +NOTICE: merging column "b" with inherited definition +create table child_b (a int4, b int4) inherits (base_tbl) distributed by (b); +NOTICE: merging column "a" with inherited definition +NOTICE: merging column "b" with inherited definition +insert into base_tbl select g, g from generate_series(1, 5) g; +explain (costs off) update base_tbl set a=a+1; +ERROR: can't split update for inherit table: base_tbl +update base_tbl set a = 5; +ERROR: can't split update for inherit table: base_tbl +-- +-- Explicit Distribution motion must be added if any of the child nodes +-- contains any motion excluding the motions in initplans. 
+-- These test cases and expectation are applicable for GPDB planner not for ORCA. +-- +SET gp_autostats_mode = NONE; +CREATE TABLE keo1 ( user_vie_project_code_pk character varying(24), user_vie_fiscal_year_period_sk character varying(24), user_vie_act_cntr_marg_cum character varying(24)) DISTRIBUTED RANDOMLY; +INSERT INTO keo1 VALUES ('1', '1', '1'); +CREATE TABLE keo2 ( projects_pk character varying(24)) DISTRIBUTED RANDOMLY; +INSERT INTO keo2 VALUES ('1'); +CREATE TABLE keo3 ( sky_per character varying(24), bky_per character varying(24)) DISTRIBUTED BY (sky_per); +INSERT INTO keo3 VALUES ('1', '1'); +CREATE TABLE keo4 ( keo_para_required_period character varying(6), keo_para_budget_date character varying(24)) DISTRIBUTED RANDOMLY; +INSERT INTO keo4 VALUES ('1', '1'); +ANALYZE keo1, keo2, keo3, keo4; +-- Explicit Redistribution motion should be added in case of GPDB Planner (test case not applicable for ORCA) +EXPLAIN (COSTS OFF) UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM + ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b + ON b.projects_pk=a.user_vie_project_code_pk + WHERE a.user_vie_fiscal_year_period_sk = + (SELECT MAX (sky_per) FROM keo3 WHERE bky_per = + (SELECT keo4.keo_para_required_period FROM keo4 WHERE keo_para_budget_date = + (SELECT min (keo4.keo_para_budget_date) FROM keo4))) + ) t1 +WHERE t1.user_vie_project_code_pk = keo1.user_vie_project_code_pk; + QUERY PLAN +------------------------------------------------------------------------------------------------------- + Update on keo1 + InitPlan 3 (returns $2) (slice3) + -> Aggregate + InitPlan 2 (returns $1) (slice5) + -> Gather Motion 3:1 (slice6; segments: 3) + InitPlan 1 (returns $0) (slice7) + -> Aggregate + -> Gather Motion 3:1 (slice8; segments: 3) + -> Seq Scan on keo4 + -> Seq Scan on keo4 keo4_1 + Filter: ((keo_para_budget_date)::text = $0) + -> Gather Motion 3:1 (slice4; segments: 3) + -> Seq Scan on keo3 + Filter: ((bky_per)::text = ($1)::text) + -> Hash 
Join + Hash Cond: ((a.user_vie_project_code_pk)::text = (b.projects_pk)::text) + -> Hash Join + Hash Cond: ((a.user_vie_project_code_pk)::text = (keo1.user_vie_project_code_pk)::text) + -> Broadcast Motion 3:3 (slice1; segments: 3) + -> Seq Scan on keo1 a + Filter: ((user_vie_fiscal_year_period_sk)::text = $2) + -> Hash + -> Seq Scan on keo1 + -> Hash + -> Broadcast Motion 3:3 (slice2; segments: 3) + -> Seq Scan on keo2 b + Optimizer: Postgres query optimizer +(27 rows) + +UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM + ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b + ON b.projects_pk=a.user_vie_project_code_pk + WHERE a.user_vie_fiscal_year_period_sk = + (SELECT MAX (sky_per) FROM keo3 WHERE bky_per = + (SELECT keo4.keo_para_required_period FROM keo4 WHERE keo_para_budget_date = + (SELECT min (keo4.keo_para_budget_date) FROM keo4))) + ) t1 +WHERE t1.user_vie_project_code_pk = keo1.user_vie_project_code_pk; +SELECT user_vie_act_cntr_marg_cum FROM keo1; + user_vie_act_cntr_marg_cum +---------------------------- + 234.682 +(1 row) + +-- Explicit Redistribution motion should not be added in case of GPDB Planner (test case not applicable to ORCA) +CREATE TABLE keo5 (x int, y int) DISTRIBUTED BY (x); +INSERT INTO keo5 VALUES (1,1); +EXPLAIN (COSTS OFF) DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 WHERE x < 2)); + QUERY PLAN +------------------------------------------------------- + Delete on keo5 + InitPlan 1 (returns $0) (slice1) + -> Gather Motion 3:1 (slice2; segments: 3) + -> Seq Scan on keo5 keo5_2 + Filter: (x < 2) + -> Result + One-Time Filter: $0 + -> Hash Join + Hash Cond: (keo5.x = keo5_1.x) + -> Seq Scan on keo5 + -> Hash + -> HashAggregate + Group Key: keo5_1.x + -> Seq Scan on keo5 keo5_1 + Optimizer: Postgres query optimizer +(15 rows) + +DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 WHERE x < 2)); +SELECT x FROM keo5; + x +--- +(0 rows) + +RESET 
gp_autostats_mode; +DROP TABLE keo1; +DROP TABLE keo2; +DROP TABLE keo3; +DROP TABLE keo4; +DROP TABLE keo5; +-- +-- text types. We should support the following updates. +-- +CREATE TEMP TABLE ttab1 (a varchar(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar(15), b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a text, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a text, b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a varchar, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar, b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE ttab1; +DROP TABLE ttab2; +CREATE TEMP TABLE ttab1 (a char(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a char(15), b integer) DISTRIBUTED BY (a); +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +DROP TABLE IF EXISTS update_distr_key; +NOTICE: table "update_distr_key" does not exist, skipping +CREATE TEMP TABLE update_distr_key (a int, b int) DISTRIBUTED BY (a); +INSERT INTO update_distr_key select i, i* 10 from generate_series(0, 9) i; +UPDATE update_distr_key SET a = 5 WHERE b = 10; +SELECT * from update_distr_key; + a | b +---+---- + 0 | 0 + 2 | 20 + 4 | 40 + 6 | 60 + 8 | 80 + 5 | 10 + 3 | 30 + 5 | 50 + 7 | 70 + 9 | 90 +(10 rows) + +DROP TABLE update_distr_key; +-- below cases is to test multi-hash-cols +CREATE TABLE tab3(c1 int, c2 int, c3 int, c4 int, c5 int) DISTRIBUTED BY (c1, c2, c3); +CREATE TABLE tab5(c1 int, c2 int, c3 int, c4 int, c5 int) DISTRIBUTED BY (c1, c2, c3, c4, c5); +INSERT INTO tab3 SELECT i, i, i, i, i FROM generate_series(1, 10)i; +INSERT INTO tab5 SELECT i, i, i, i, i FROM generate_series(1, 10)i; +-- test tab3 +SELECT gp_segment_id, * FROM tab3; + 
gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 + 2 | 1 | 1 | 1 | 1 | 1 + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 +(10 rows) + +UPDATE tab3 set c1 = 9 where c4 = 1; +SELECT gp_segment_id, * FROM tab3; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 + 0 | 9 | 1 | 1 | 1 | 1 +(10 rows) + +UPDATE tab3 set (c1,c2) = (5,6) where c4 = 1; +SELECT gp_segment_id, * FROM tab3; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 5 | 6 | 1 | 1 | 1 +(10 rows) + +UPDATE tab3 set (c1,c2,c3) = (3,2,1) where c4 = 1; +SELECT gp_segment_id, * FROM tab3; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 3 | 2 | 1 | 1 | 1 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 10 | 10 | 10 | 10 | 10 + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 +(10 rows) + +UPDATE tab3 set c1 = 11 where c2 = 10 and c2 < 1; +SELECT gp_segment_id, * FROM tab3; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 0 | 5 | 5 | 5 | 5 | 5 + 0 | 8 | 8 | 8 | 8 | 8 + 2 | 2 | 2 | 2 | 2 | 2 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 3 | 2 | 1 | 1 | 1 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 4 | 4 | 4 | 4 | 4 + 1 | 9 | 9 | 9 | 9 | 9 + 1 | 
10 | 10 | 10 | 10 | 10 +(10 rows) + +-- test tab5 +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 + 1 | 1 | 1 | 1 | 1 | 1 + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 +(10 rows) + +UPDATE tab5 set c1 = 1000 where c4 = 1; +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+------+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 1 | 1000 | 1 | 1 | 1 | 1 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 +(10 rows) + +UPDATE tab5 set (c1,c2) = (9,10) where c4 = 1; +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 + 0 | 9 | 10 | 1 | 1 | 1 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 +(10 rows) + +UPDATE tab5 set (c1,c2,c4) = (5,8,6) where c4 = 1; +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 + 0 | 5 | 8 | 1 | 6 | 1 +(10 rows) + +UPDATE tab5 set (c1,c2,c3,c4,c5) = (1,2,3,0,6) where c5 = 1; +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 
| 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 1 | 1 | 2 | 3 | 0 | 6 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 +(10 rows) + +UPDATE tab5 set c1 = 11 where c3 = 10 and c3 < 1; +SELECT gp_segment_id, * FROM tab5; + gp_segment_id | c1 | c2 | c3 | c4 | c5 +---------------+----+----+----+----+---- + 0 | 4 | 4 | 4 | 4 | 4 + 0 | 9 | 9 | 9 | 9 | 9 + 0 | 10 | 10 | 10 | 10 | 10 + 1 | 2 | 2 | 2 | 2 | 2 + 1 | 3 | 3 | 3 | 3 | 3 + 1 | 5 | 5 | 5 | 5 | 5 + 1 | 1 | 2 | 3 | 0 | 6 + 2 | 6 | 6 | 6 | 6 | 6 + 2 | 7 | 7 | 7 | 7 | 7 + 2 | 8 | 8 | 8 | 8 | 8 +(10 rows) + +EXPLAIN (COSTS OFF ) UPDATE tab3 SET C1 = C1 + 1, C5 = C5+1; + QUERY PLAN +--------------------------------------------------------------- + Update on tab3 + -> Explicit Redistribute Motion 3:3 (slice1; segments: 3) + -> Split + -> Seq Scan on tab3 + Optimizer: Postgres query optimizer +(5 rows) + +-- clean up +drop table tab3; +drop table tab5; +-- Update distribution key +-- start_ignore +drop table if exists r; +NOTICE: table "r" does not exist, skipping +drop table if exists s; +NOTICE: table "s" does not exist, skipping +drop table if exists update_dist; +NOTICE: table "update_dist" does not exist, skipping +drop table if exists update_ao_table; +NOTICE: table "update_ao_table" does not exist, skipping +drop table if exists update_aoco_table; +NOTICE: table "update_aoco_table" does not exist, skipping +-- end_ignore +-- Update normal table distribution key +create table update_dist(a int) distributed by (a); +insert into update_dist values(1); +update update_dist set a=0 where a=1; +select * from update_dist; + a +--- + 0 +(1 row) + +-- Update distribution key with join +create table r (a int, b int) distributed by (a); +create table s (a int, b int) distributed by (a); +insert into r select generate_series(1, 5), generate_series(1, 5) * 2; +insert into s select generate_series(1, 5), generate_series(1, 5) * 2; +select * from r; + a | b +---+---- + 3 | 6 + 4 | 8 + 5 | 10 + 1 | 2 + 2 | 4 +(5 rows) 
+ +select * from s; + a | b +---+---- + 1 | 2 + 2 | 4 + 3 | 6 + 4 | 8 + 5 | 10 +(5 rows) + +update r set a = r.a + 1 from s where r.a = s.a; +select * from r; + a | b +---+---- + 4 | 6 + 5 | 8 + 6 | 10 + 3 | 4 + 2 | 2 +(5 rows) + +update r set a = r.a + 1 where a in (select a from s); +select * from r; + a | b +---+---- + 6 | 10 + 5 | 6 + 6 | 8 + 4 | 4 + 3 | 2 +(5 rows) + +-- Update redistribution +delete from r; +delete from s; +insert into r select generate_series(1, 5), generate_series(1, 5); +insert into s select generate_series(1, 5), generate_series(1, 5) * 2; +select * from r; + a | b +---+--- + 3 | 3 + 4 | 4 + 5 | 5 + 1 | 1 + 2 | 2 +(5 rows) + +select * from s; + a | b +---+---- + 3 | 6 + 4 | 8 + 5 | 10 + 1 | 2 + 2 | 4 +(5 rows) + +update r set a = r.a + 1 from s where r.b = s.b; +select * from r; + a | b +---+--- + 1 | 1 + 3 | 3 + 5 | 5 + 5 | 4 + 3 | 2 +(5 rows) + +update r set a = r.a + 1 where b in (select b from s); +select * from r; + a | b +---+--- + 1 | 1 + 3 | 3 + 5 | 5 + 6 | 4 + 4 | 2 +(5 rows) + +-- Update hash aggreate group by +delete from r; +delete from s; +insert into r select generate_series(1, 5), generate_series(1, 5) * 2; +insert into s select generate_series(1, 5), generate_series(1, 5); +select * from r; + a | b +---+---- + 1 | 2 + 2 | 4 + 3 | 6 + 4 | 8 + 5 | 10 +(5 rows) + +select * from s; + a | b +---+--- + 3 | 3 + 4 | 4 + 5 | 5 + 1 | 1 + 2 | 2 +(5 rows) + +update s set a = s.a + 1 where exists (select 1 from r where s.a = r.b); +select * from s; + a | b +---+--- + 1 | 1 + 3 | 3 + 5 | 5 + 3 | 2 + 5 | 4 +(5 rows) + +-- Update ao table distribution key +create table update_ao_table (a int, b int) WITH (appendonly=true) distributed by (a); +insert into update_ao_table select g, g from generate_series(1, 5) g; +select * from update_ao_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 3 | 3 + 4 | 4 + 5 | 5 +(5 rows) + +update update_ao_table set a = a + 1 where b = 3; +select * from update_ao_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 4 | 4 + 5 | 
5 + 4 | 3 +(5 rows) + +-- Update aoco table distribution key +create table update_aoco_table (a int, b int) WITH (appendonly=true, orientation=column) distributed by (a); +insert into update_aoco_table select g,g from generate_series(1, 5) g; +select * from update_aoco_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 3 | 3 + 4 | 4 + 5 | 5 +(5 rows) + +update update_aoco_table set a = a + 1 where b = 3; +select * from update_aoco_table; + a | b +---+--- + 1 | 1 + 2 | 2 + 4 | 4 + 5 | 5 + 4 | 3 +(5 rows) + +-- Update prepare +delete from s; +insert into s select generate_series(1, 5), generate_series(1, 5); +select * from r; + a | b +---+---- + 1 | 2 + 2 | 4 + 3 | 6 + 4 | 8 + 5 | 10 +(5 rows) + +select * from s; + a | b +---+--- + 1 | 1 + 2 | 2 + 3 | 3 + 4 | 4 + 5 | 5 +(5 rows) + +prepare update_s(int) as update s set a = s.a + $1 where exists (select 1 from r where s.a = r.b); +execute update_s(10); +select * from s; + a | b +----+--- + 1 | 1 + 14 | 4 + 3 | 3 + 5 | 5 + 12 | 2 +(5 rows) + +-- Confirm that a split update is not created for a table excluded by +-- constraints in the planner. +create table nosplitupdate (a int) distributed by (a); +explain update nosplitupdate set a=0 where a=1 and a<1; + QUERY PLAN +----------------------------------------------------------- + Update on nosplitupdate (cost=0.00..0.01 rows=1 width=0) + -> Result (cost=0.00..0.01 rows=1 width=0) + One-Time Filter: false + Planning time: 0.271 ms + Optimizer: Postgres query optimizer +(5 rows) + +-- test split-update when split-node's flow is entry +create table tsplit_entry (c int); +NOTICE: Table doesn't have 'DISTRIBUTED BY' clause -- Using column named 'c' as the Cloudberry Database data distribution key for this table. +HINT: The 'DISTRIBUTED BY' clause determines the distribution of data. Make sure column(s) chosen are the optimal data distribution key to minimize skew. 
+insert into tsplit_entry values (1), (2); +analyze tsplit_entry; +-- start_ignore +-- gp_segment_configuration scan is different when using different FTS +explain update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; + QUERY PLAN +------------------------------------------------------------------------------------------------------------------ + Update on tsplit_entry (cost=10000000001.00..10000000003.18 rows=3 width=54) + -> Explicit Redistribute Motion 1:3 (slice) (cost=10000000001.00..10000000003.18 rows=7 width=54) + -> Split (cost=10000000001.00..10000000003.18 rows=7 width=54) + -> Nested Loop (cost=10000000001.00..10000000003.12 rows=4 width=54) + -> Gather Motion 3:1 (slice2; segments: 3) (cost=0.00..2.06 rows=2 width=14) + -> Seq Scan on tsplit_entry (cost=0.00..2.02 rows=1 width=14) + -> Materialize (cost=1.00..1.03 rows=1 width=40) + -> Subquery Scan on s (cost=1.00..1.02 rows=1 width=40) + -> Aggregate (cost=1.00..1.01 rows=1 width=8) + -> Function Scan on gp_get_segment_configuration (cost=0.00..1.00 rows=1 width=0) + Optimizer: Postgres query optimizer +(11 rows) +-- end_ignore +update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; +CREATE TABLE update_gp_foo ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo_1_prt_p20190305', appendonly=false) + ); +CREATE TABLE update_gp_foo1 ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo1_1_prt_p20190305', appendonly=false) + ); +INSERT INTO update_gp_foo VALUES (12, 40, 1, 50); +INSERT INTO update_gp_foo1 VALUES (12, 3, 1, 50); +UPDATE update_gp_foo +SET b = update_gp_foo.c_part, + d = update_gp_foo1.a_dist +FROM update_gp_foo1; +SELECT * 
from update_gp_foo; + a_dist | b | c_part | d +--------+---+--------+---- + 12 | 1 | 1 | 12 +(1 row) + +-- Test insert on conflict do update +-- Insert on conflict do update is an insert statement but might +-- invoke ExecUpdate on segments, but updating distkeys of a table +-- may lead to wrong data distribution. We will check this before +-- planning, if a `insert on conflict do update` statement set the +-- dist keys of the table, it will raise an error. +-- See github issue: https://github.com/greenplum-db/gpdb/issues/9444 +create table t_insert_on_conflict_update_distkey(a int, b int) distributed by (a); +create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); +-- the following statement should error out because the on conflict update want to +-- modify the tuple's distkey which might lead to wrong data distribution +insert into t_insert_on_conflict_update_distkey values (1, 1) on conflict(a, b) do update set a = 1; +ERROR: modification of distribution columns in OnConflictUpdate is not supported +drop index uidx_t_insert_on_conflict_update_distkey; +drop table t_insert_on_conflict_update_distkey; +-- randomly distributed table cannot add unique constrain, so next we test replicated table +create table t_insert_on_conflict_update_distkey(a int, b int) distributed replicated; +create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); +-- the following statement should succeed because replicated table does not contain distkey +insert into t_insert_on_conflict_update_distkey values (1, 1) on conflict(a, b) do update set a = 1; +ERROR: not implemented yet on pax relations: TupleInsertSpeculative +-- Some tests on a partitioned table. 
+CREATE TABLE update_gp_rangep (a int, b int, orig_a int) DISTRIBUTED BY (b) PARTITION BY RANGE (a); +CREATE TABLE update_gp_rangep_1_to_10 PARTITION OF update_gp_rangep FOR VALUES FROM (1) TO (10); +CREATE TABLE update_gp_rangep_10_to_20 PARTITION OF update_gp_rangep FOR VALUES FROM (10) TO (20); +INSERT INTO update_gp_rangep SELECT g, g, g FROM generate_series(1, 4) g; +-- Simple case: Same partition, same node. +UPDATE update_gp_rangep SET a = 9 WHERE a = 1; +-- Distribution key update, same partition. +UPDATE update_gp_rangep SET b = 1 WHERE a = 2; +-- Move row to different partition, but no change in distribution key +UPDATE update_gp_rangep SET a = 10 WHERE a = 3; +-- Move row to different partition and also change distribution key +UPDATE update_gp_rangep SET a = 11, b = 1 WHERE a = 4; +SELECT tableoid::regclass, * FROM update_gp_rangep ORDER BY orig_a; + tableoid | a | b | orig_a +---------------------------+----+---+-------- + update_gp_rangep_1_to_10 | 9 | 1 | 1 + update_gp_rangep_1_to_10 | 2 | 1 | 2 + update_gp_rangep_10_to_20 | 10 | 3 | 3 + update_gp_rangep_10_to_20 | 11 | 1 | 4 +(4 rows) + +-- Also do a lookup with specific distribution key. If the rows were not +-- correctly moved across segments, this would fail to find them, assuming +-- that direct dispatch is effective. 
+SELECT tableoid::regclass, * FROM update_gp_rangep WHERE b = 1; + tableoid | a | b | orig_a +---------------------------+----+---+-------- + update_gp_rangep_1_to_10 | 2 | 1 | 2 + update_gp_rangep_1_to_10 | 9 | 1 | 1 + update_gp_rangep_10_to_20 | 11 | 1 | 4 +(3 rows) + +-- start_ignore +drop table r; +drop table s; +drop table update_dist; +drop table update_ao_table; +drop table update_aoco_table; +drop table nosplitupdate; +drop table tsplit_entry; +-- end_ignore diff --git a/contrib/pax_storage/hd-ci/clang_tidy_pax.bash b/contrib/pax_storage/hd-ci/clang_tidy_pax.bash index 6d94247c41d..108c4bdfaab 100644 --- a/contrib/pax_storage/hd-ci/clang_tidy_pax.bash +++ b/contrib/pax_storage/hd-ci/clang_tidy_pax.bash @@ -16,7 +16,7 @@ function do_git_diff() { exit 0 fi - modified_files=$(git diff --name-only $CBDB_PAX_DEV_BRANCH) + modified_files=$(git diff --name-only $CBDB_PAX_DEV_BRANCH -- ':!icw_test') for extension in "${CBDB_PAX_EXT[@]}"; do if echo "$modified_files" | grep -E -e "$extension" | grep -q -v "$CBDB_PAXC_GREP"; then files=$(echo "$modified_files" | grep -E -e "$extension" | grep -v "$CBDB_PAXC_GREP") diff --git a/contrib/pax_storage/sql/ddl.sql b/contrib/pax_storage/sql/ddl.sql new file mode 100644 index 00000000000..fbb390e12ae --- /dev/null +++ b/contrib/pax_storage/sql/ddl.sql @@ -0,0 +1,51 @@ +set default_table_access_method = 'pax'; + +create table pax_test.t1( + id int, + name text not null, + height float not null, + decimal_col decimal(10, 2) not null, + created_at timestamp with time zone not null, + updated_at timestamp with time zone not null +) using pax distributed BY (id); +\d+ pax_test.t1 + +create table pax_test.t2( + id int, + name text not null, + height float not null, + decimal_col decimal(10, 2) not null, + created_at timestamp with time zone not null, + updated_at timestamp with time zone not null +); +\d+ pax_test.t2 + +insert into pax_test.t1 (id, name, height, decimal_col, created_at, updated_at) values + (1, 'Alice', 1.65, 
1.23, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'), + (2, 'Bob', 1.75, 2.34, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'), + (3, 'Carol', 1.85, 3.45, '2023-05-17 17:56:49.633664+08', '2023-05-17 17:56:49.633664+08'); + +alter table pax_test.t1 add column new_col1 int; +alter table pax_test.t1 add column new_col2 int default null; +alter table pax_test.t1 add column new_col3 int default 0; +alter table pax_test.t1 add column new_col4 int default 12; + +select * from pax_test.t1; + +alter table pax_test.t1 drop column new_col2; +alter table pax_test.t1 drop column new_col3; + +vacuum pax_test.t1; +vacuum full pax_test.t1; + +drop table pax_test.t1; +drop table pax_test.t2; + +-- alter column with options +create table pax_test.t3 (v1 numeric(100,1)) with(compresstype=zstd, compresslevel=1); +alter table pax_test.t3 alter column v1 type numeric; +drop table pax_test.t3; +-- add column with options +create table pax_test.t4 (v1 text) with(compresstype=zstd, compresslevel=1); +alter table pax_test.t4 add column v2 text; +drop table pax_test.t4; diff --git a/contrib/pax_storage/sql/detoast.sql b/contrib/pax_storage/sql/detoast.sql new file mode 100644 index 00000000000..0af5be392e7 --- /dev/null +++ b/contrib/pax_storage/sql/detoast.sql @@ -0,0 +1,51 @@ +CREATE TABLE toasttest_external(f1 text); +-- The storage `EXTERNAL` allows out-of-line storage but not compression. +alter table toasttest_external alter column f1 set storage external; +-- These tests are sensitive to block size. In CBDB, the block +-- size is 32 kB, whereas in PostgreSQL it's 8kB. Therefore make +-- the data 4x larger here. 
+INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +INSERT INTO toasttest_external values (repeat('1234567890',300*4)); +-- expect >0 blocks +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty + FROM pg_class where relname = 'toasttest_external'; + +create table toasttest_external_pax(f1 text) using pax; +insert into toasttest_external_pax select * from toasttest_external; +drop table toasttest_external; +-- If pax insert toast here, Then after drop toasttest_external, toast +-- will not get the source data. +select length(f1) from toasttest_external_pax; +drop table toasttest_external_pax; + + +CREATE TABLE toasttest_compress(f1 text); +-- The storage `MAIN` allows compression but not out-of-line storage. +alter table toasttest_compress alter column f1 set storage main; +-- about 1M +INSERT INTO toasttest_compress values (repeat('1234567890123456',1024 * 64)); +-- should be true, becase it's not store in toast table +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty FROM pg_class where relname = 'toasttest_compress'; + +create table toasttest_compress_pax(f1 text) using pax; +insert into toasttest_compress_pax select * from toasttest_compress; +drop table toasttest_compress; +select length(f1) from toasttest_compress_pax; +drop table toasttest_compress_pax; + +CREATE TABLE toasttest_extended(f1 text); +-- The storage `EXTENDED` allows both compression and out-of-line storage. 
+alter table toasttest_extended alter column f1 set storage EXTENDED; +-- about 1M, will use out-of-line storage +INSERT INTO toasttest_extended values (repeat('1234567890123456',1024 * 64)); +-- about 80k , will use compression storage +INSERT INTO toasttest_extended values (repeat('1234567890123456',1024 * 5)); +SELECT pg_relation_size(reltoastrelid) = 0 AS is_empty FROM pg_class where relname = 'toasttest_extended'; + +create table toasttest_extended_pax(f1 text) using pax; +insert into toasttest_extended_pax select * from toasttest_extended; +drop table toasttest_extended; +select length(f1) from toasttest_extended_pax; +drop table toasttest_extended_pax; \ No newline at end of file diff --git a/contrib/pax_storage/sql/setup.sql b/contrib/pax_storage/sql/setup.sql new file mode 100644 index 00000000000..0966d0946a8 --- /dev/null +++ b/contrib/pax_storage/sql/setup.sql @@ -0,0 +1,3 @@ +-- start_ignore +create schema pax_test; +-- end_ignore diff --git a/contrib/pax_storage/sql/teardown.sql b/contrib/pax_storage/sql/teardown.sql new file mode 100644 index 00000000000..641380076f8 --- /dev/null +++ b/contrib/pax_storage/sql/teardown.sql @@ -0,0 +1,3 @@ +-- start_ignore +drop schema if exists pax_test; +-- end_ignore diff --git a/contrib/pax_storage/src/data/sql/types.sql b/contrib/pax_storage/sql/types.sql similarity index 54% rename from contrib/pax_storage/src/data/sql/types.sql rename to contrib/pax_storage/sql/types.sql index 6eb3e09f895..1509c634889 100644 --- a/contrib/pax_storage/src/data/sql/types.sql +++ b/contrib/pax_storage/sql/types.sql @@ -1,9 +1,5 @@ --- start_ignore -create extension pax; -drop table if exists all_typbyval_pg_types; --- end_ignore -CREATE TABLE all_typbyval_pg_types ( +CREATE TABLE pax_test.all_typbyval_pg_types ( id int, bool_col bool, char_col char, @@ -26,16 +22,12 @@ CREATE TABLE all_typbyval_pg_types ( pg_lsn_col pg_lsn ) USING pax distributed by (id); -insert into all_typbyval_pg_types values(1, 
true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), +insert into pax_test.all_typbyval_pg_types values(1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), (1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'), (1, true,'c',2,'cid',4.2,5,'2023-05-17 17:56:49',7,'2023-05-17 17:56:49',10,11.1111,12,'2023-05-17 17:56:49','2023-05-17 17:56:49', '16/0'); -select * from all_typbyval_pg_types; +select * from pax_test.all_typbyval_pg_types; --- start_ignore -drop table if exists all_typlen_lt_0_pg_type; --- end_ignore - -create table all_typlen_lt_0_pg_type ( +create table pax_test.all_typlen_lt_0_pg_type ( id int, name_col name, numeric_col numeric, @@ -44,9 +36,8 @@ create table all_typlen_lt_0_pg_type ( point_col point ) USING pax distributed by (id); -insert into all_typlen_lt_0_pg_type values(1,'hello', 1.23, 'text', 'varchar', point(1,2)); -select * from all_typlen_lt_0_pg_type; +insert into pax_test.all_typlen_lt_0_pg_type values(1,'hello', 1.23, 'text', 'varchar', point(1,2)); +select * from pax_test.all_typlen_lt_0_pg_type; --- start_ignore -drop table if exists all_typbyval_pg_types; --- end_ignore \ No newline at end of file +drop table pax_test.all_typbyval_pg_types; +drop table pax_test.all_typlen_lt_0_pg_type; diff --git a/contrib/pax_storage/sql/update.sql b/contrib/pax_storage/sql/update.sql new file mode 100644 index 00000000000..669ba110f4c --- /dev/null +++ b/contrib/pax_storage/sql/update.sql @@ -0,0 +1,386 @@ +set default_table_access_method = pax; +set pax.enable_filter = off; + +-- +-- UPDATE ... 
SET = DEFAULT; +-- + +CREATE TABLE update_test ( + a INT DEFAULT 10, + b INT, + c TEXT +); + +CREATE TABLE upsert_test ( + a INT PRIMARY KEY, + b TEXT +); + +INSERT INTO update_test VALUES (5, 10, 'foo'); +INSERT INTO update_test(b, a) VALUES (15, 10); + +SELECT a,b,c FROM update_test ORDER BY a,b,c; + +UPDATE update_test SET a = DEFAULT, b = DEFAULT; + +SELECT a,b,c FROM update_test ORDER BY a,b,c; + +-- aliases for the UPDATE target table +UPDATE update_test AS t SET b = 10 WHERE t.a = 10; + +SELECT a,b,c FROM update_test ORDER BY a,b,c; + +UPDATE update_test t SET b = t.b + 10 WHERE t.a = 10; + +SELECT a,b,c FROM update_test ORDER BY a,b,c; + +-- +-- Test VALUES in FROM +-- + +UPDATE update_test SET a=v.i FROM (VALUES(100, 20)) AS v(i, j) + WHERE update_test.b = v.j; + +SELECT a,b,c FROM update_test ORDER BY a,b,c; + +-- fail, wrong data type: +UPDATE update_test SET a = v.* FROM (VALUES(100, 20)) AS v(i, j) + WHERE update_test.b = v.j; + +-- +-- Test multiple-set-clause syntax +-- + +INSERT INTO update_test SELECT a,b+1,c FROM update_test; +SELECT * FROM update_test; + +UPDATE update_test SET (c,b,a) = ('bugle', b+11, DEFAULT) WHERE c = 'foo'; +SELECT a,b,c FROM update_test ORDER BY a,b,c; +UPDATE update_test SET (c,b) = ('car', a+b), a = a + 1 WHERE a = 10; +SELECT a,b,c FROM update_test ORDER BY a,b,c; +-- fail, multi assignment to same column: +UPDATE update_test SET (c,b) = ('car', a+b), b = a + 1 WHERE a = 10; + +-- uncorrelated sub-select: +UPDATE update_test + SET (b,a) = (select a,b from update_test where b = 41 and c = 'car') + WHERE a = 100 AND b = 20; +SELECT * FROM update_test; +-- correlated sub-select: +UPDATE update_test o + SET (b,a) = (select a+1,b from update_test i + where i.a=o.a and i.b=o.b and i.c is not distinct from o.c); +SELECT * FROM update_test; +-- fail, multiple rows supplied: +UPDATE update_test SET (b,a) = (select a+1,b from update_test); +-- set to null if no rows supplied: +UPDATE update_test SET (b,a) = (select a+1,b from 
update_test where a = 1000) + WHERE a = 11; +SELECT * FROM update_test; +-- *-expansion should work in this context: +UPDATE update_test SET (a,b) = ROW(v.*) FROM (VALUES(21, 100)) AS v(i, j) + WHERE update_test.a = v.i; +-- you might expect this to work, but syntactically it's not a RowExpr: +UPDATE update_test SET (a,b) = (v.*) FROM (VALUES(21, 101)) AS v(i, j) + WHERE update_test.a = v.i; + +-- if an alias for the target table is specified, don't allow references +-- to the original table name +UPDATE update_test AS t SET b = update_test.b + 10 WHERE t.a = 10; + +-- Make sure that we can update to a TOASTed value. +UPDATE update_test SET c = repeat('x', 10000) WHERE c = 'car'; +SELECT a, b, char_length(c) FROM update_test; + +-- Check multi-assignment with a Result node to handle a one-time filter. +EXPLAIN (VERBOSE, COSTS OFF) +UPDATE update_test t + SET (a, b) = (SELECT b, a FROM update_test s WHERE s.a = t.a) + WHERE CURRENT_USER = SESSION_USER; +UPDATE update_test t + SET (a, b) = (SELECT b, a FROM update_test s WHERE s.a = t.a) + WHERE CURRENT_USER = SESSION_USER; +SELECT a, b, char_length(c) FROM update_test; + +-- Test ON CONFLICT DO UPDATE + +INSERT INTO upsert_test VALUES(1, 'Boo'), (3, 'Zoo'); +-- uncorrelated sub-select: +WITH aaa AS (SELECT 1 AS a, 'Foo' AS b) INSERT INTO upsert_test + VALUES (1, 'Bar') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b, a FROM aaa) RETURNING *; +-- correlated sub-select: +INSERT INTO upsert_test VALUES (1, 'Baz'), (3, 'Zaz') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Correlated', a from upsert_test i WHERE i.a = upsert_test.a) + RETURNING *; +-- correlated sub-select (EXCLUDED.* alias): +INSERT INTO upsert_test VALUES (1, 'Bat'), (3, 'Zot') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING *; + +-- ON CONFLICT using system attributes in RETURNING, testing both the +-- inserting and updating paths. 
See bug report at: +-- https://www.postgresql.org/message-id/73436355-6432-49B1-92ED-1FE4F7E7E100%40finefun.com.au +INSERT INTO upsert_test VALUES (2, 'Beeble') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING tableoid::regclass, xmin = pg_current_xact_id()::xid AS xmin_correct, xmax = 0 AS xmax_correct; +-- currently xmax is set after a conflict - that's probably not good, +-- but it seems worthwhile to have to be explicit if that changes. +INSERT INTO upsert_test VALUES (2, 'Brox') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b || ', Excluded', a from upsert_test i WHERE i.a = excluded.a) + RETURNING tableoid::regclass, xmin = pg_current_xact_id()::xid AS xmin_correct, xmax = pg_current_xact_id()::xid AS xmax_correct; + +DROP TABLE update_test; +DROP TABLE upsert_test; + +-- Test ON CONFLICT DO UPDATE with partitioned table and non-identical children + +CREATE TABLE upsert_test ( + a INT PRIMARY KEY, + b TEXT +) PARTITION BY LIST (a); + +CREATE TABLE upsert_test_1 PARTITION OF upsert_test FOR VALUES IN (1); +CREATE TABLE upsert_test_2 (b TEXT, a INT PRIMARY KEY); +ALTER TABLE upsert_test ATTACH PARTITION upsert_test_2 FOR VALUES IN (2); + +INSERT INTO upsert_test VALUES(1, 'Boo'), (2, 'Zoo'); +-- uncorrelated sub-select: +WITH aaa AS (SELECT 1 AS a, 'Foo' AS b) INSERT INTO upsert_test + VALUES (1, 'Bar') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT b, a FROM aaa) RETURNING *; +-- correlated sub-select: +WITH aaa AS (SELECT 1 AS ctea, ' Foo' AS cteb) INSERT INTO upsert_test + VALUES (1, 'Bar'), (2, 'Baz') ON CONFLICT(a) + DO UPDATE SET (b, a) = (SELECT upsert_test.b||cteb, upsert_test.a FROM aaa) RETURNING *; + +DROP TABLE upsert_test; + + +--------------------------- +-- UPDATE with row movement +--------------------------- + +-- When a partitioned table receives an UPDATE to the partitioned key and the +-- new values no longer meet the partition's bound, the row must be moved to +-- 
the correct partition for the new partition key (if one exists). We must +-- also ensure that updatable views on partitioned tables properly enforce any +-- WITH CHECK OPTION that is defined. The situation with triggers in this case +-- also requires thorough testing as partition key updates causing row +-- movement convert UPDATEs into DELETE+INSERT. + +CREATE TABLE range_parted ( + a text, + b bigint, + c numeric, + d int, + e varchar +) PARTITION BY RANGE (a, b); + +-- Create partitions intentionally in descending bound order, so as to test +-- that update-row-movement works with the leaf partitions not in bound order. +CREATE TABLE part_b_20_b_30 (e varchar, c numeric, a text, b bigint, d int); +-- GPDB: distribution policy must match the parent table. +alter table part_b_20_b_30 set distributed by (a); +ALTER TABLE range_parted ATTACH PARTITION part_b_20_b_30 FOR VALUES FROM ('b', 20) TO ('b', 30); +CREATE TABLE part_b_10_b_20 (e varchar, c numeric, a text, b bigint, d int) PARTITION BY RANGE (c); +alter table part_b_10_b_20 set distributed by (a); +CREATE TABLE part_b_1_b_10 PARTITION OF range_parted FOR VALUES FROM ('b', 1) TO ('b', 10); +ALTER TABLE range_parted ATTACH PARTITION part_b_10_b_20 FOR VALUES FROM ('b', 10) TO ('b', 20); +CREATE TABLE part_a_10_a_20 PARTITION OF range_parted FOR VALUES FROM ('a', 10) TO ('a', 20); +CREATE TABLE part_a_1_a_10 PARTITION OF range_parted FOR VALUES FROM ('a', 1) TO ('a', 10); + +-- Check that partition-key UPDATE works sanely on a partitioned table that +-- does not have any child partitions. +UPDATE part_b_10_b_20 set b = b - 6; + +-- Create some more partitions following the above pattern of descending bound +-- order, but let's make the situation a bit more complex by having the +-- attribute numbers of the columns vary from their parent partition. 
+CREATE TABLE part_c_100_200 (e varchar, c numeric, a text, b bigint, d int) PARTITION BY range (abs(d)); +ALTER TABLE part_c_100_200 DROP COLUMN e, DROP COLUMN c, DROP COLUMN a; +ALTER TABLE part_c_100_200 ADD COLUMN c numeric, ADD COLUMN e varchar, ADD COLUMN a text; +ALTER TABLE part_c_100_200 DROP COLUMN b; +ALTER TABLE part_c_100_200 ADD COLUMN b bigint; +CREATE TABLE part_d_1_15 PARTITION OF part_c_100_200 FOR VALUES FROM (1) TO (15); +CREATE TABLE part_d_15_20 PARTITION OF part_c_100_200 FOR VALUES FROM (15) TO (20); + +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_100_200 FOR VALUES FROM (100) TO (200); + +-- GPDB: distribution policy must match the parent table, so the previous command fails. +-- Change the distribution key and try again. +alter table part_c_100_200 set distributed by (a); +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_100_200 FOR VALUES FROM (100) TO (200); + +CREATE TABLE part_c_1_100 (e varchar, d int, c numeric, b bigint, a text); +alter table part_c_1_100 set distributed by (a); +ALTER TABLE part_b_10_b_20 ATTACH PARTITION part_c_1_100 FOR VALUES FROM (1) TO (100); + +\set init_range_parted 'truncate range_parted; insert into range_parted VALUES (''a'', 1, 1, 1), (''a'', 10, 200, 1), (''b'', 12, 96, 1), (''b'', 13, 97, 2), (''b'', 15, 105, 16), (''b'', 17, 105, 19)' +\set show_data 'select tableoid::regclass::text COLLATE "C" partname, * from range_parted ORDER BY 1, 2, 3, 4, 5, 6' +:init_range_parted; +:show_data; + +-- The order of subplans should be in bound order +EXPLAIN (costs off) UPDATE range_parted set c = c - 50 WHERE c > 97; + +-- fail, row movement happens only within the partition subtree. 
+UPDATE part_c_100_200 set c = c - 20, d = c WHERE c = 105; +-- fail, no partition key update, so no attempt to move tuple, +-- but "a = 'a'" violates partition constraint enforced by root partition) +UPDATE part_b_10_b_20 set a = 'a'; +-- ok, partition key update, no constraint violation +UPDATE range_parted set d = d - 10 WHERE d > 10; +-- ok, no partition key update, no constraint violation +UPDATE range_parted set e = d; +-- No row found +UPDATE part_c_1_100 set c = c + 20 WHERE c = 98; +-- ok, row movement +UPDATE part_b_10_b_20 set c = c + 20 returning c, b, a; +:show_data; + +-- fail, row movement happens only within the partition subtree. +UPDATE part_b_10_b_20 set b = b - 6 WHERE c > 116 returning *; +-- ok, row movement, with subset of rows moved into different partition. +UPDATE range_parted set b = b - 6 WHERE c > 116 returning a, b + c; + +:show_data; + +-- Common table needed for multiple test scenarios. +CREATE TABLE mintab(c1 int); +INSERT into mintab VALUES (120); + +-- update partition key using updatable view. +CREATE VIEW upview AS SELECT * FROM range_parted WHERE (select c > c1 FROM mintab) WITH CHECK OPTION; +-- ok +UPDATE upview set c = 199 WHERE b = 4; +-- fail, check option violation +UPDATE upview set c = 120 WHERE b = 4; +-- fail, row movement with check option violation +UPDATE upview set a = 'b', b = 15, c = 120 WHERE b = 4; +-- ok, row movement, check option passes +UPDATE upview set a = 'b', b = 15 WHERE b = 4; + +:show_data; + +-- cleanup +DROP VIEW upview; + +-- RETURNING having whole-row vars. 
+:init_range_parted; +UPDATE range_parted set c = 95 WHERE a = 'b' and b > 10 and c > 100 returning (range_parted), *; +:show_data; + + +-- Creating default partition for range +:init_range_parted; +create table part_def partition of range_parted default; +\d+ part_def +insert into range_parted values ('c', 9); +-- ok +update part_def set a = 'd' where a = 'c'; +-- fail +update part_def set a = 'a' where a = 'd'; + +:show_data; + +-- Update row movement from non-default to default partition. +-- fail, default partition is not under part_a_10_a_20; +UPDATE part_a_10_a_20 set a = 'ad' WHERE a = 'a'; +-- ok +UPDATE range_parted set a = 'ad' WHERE a = 'a'; +UPDATE range_parted set a = 'bd' WHERE a = 'b'; +:show_data; +-- Update row movement from default to non-default partitions. +-- ok +UPDATE range_parted set a = 'a' WHERE a = 'ad'; +UPDATE range_parted set a = 'b' WHERE a = 'bd'; +:show_data; + +-- Cleanup: range_parted no longer needed. +DROP TABLE range_parted; + +CREATE TABLE list_parted ( + a text, + b int +) PARTITION BY list (a); +CREATE TABLE list_part1 PARTITION OF list_parted for VALUES in ('a', 'b'); +CREATE TABLE list_default PARTITION OF list_parted default; +INSERT into list_part1 VALUES ('a', 1); +INSERT into list_default VALUES ('d', 10); + +-- fail +UPDATE list_default set a = 'a' WHERE a = 'd'; +-- ok +UPDATE list_default set a = 'x' WHERE a = 'd'; + +DROP TABLE list_parted; + +-------------- +-- Some more update-partition-key test scenarios below. This time use list +-- partitions. +-------------- + +-- Setup for list partitions +CREATE TABLE list_parted (a numeric, b int, c int8) PARTITION BY list (a); +CREATE TABLE sub_parted PARTITION OF list_parted for VALUES in (1) PARTITION BY list (b); + +CREATE TABLE sub_part1(b int, c int8, a numeric); +alter table sub_part1 set distributed by (a); -- GPDB: distribution policy must match the parent table. 
+ALTER TABLE sub_parted ATTACH PARTITION sub_part1 for VALUES in (1); +CREATE TABLE sub_part2(b int, c int8, a numeric); +alter table sub_part2 set distributed by (a); -- GPDB: distribution policy must match the parent table. +ALTER TABLE sub_parted ATTACH PARTITION sub_part2 for VALUES in (2); + +CREATE TABLE list_part1(a numeric, b int, c int8); +ALTER TABLE list_parted ATTACH PARTITION list_part1 for VALUES in (2,3); + +INSERT into list_parted VALUES (2,5,50); +INSERT into list_parted VALUES (3,6,60); +INSERT into sub_parted VALUES (1,1,60); +INSERT into sub_parted VALUES (1,2,10); + +-- Test partition constraint violation when intermediate ancestor is used and +-- constraint is inherited from upper root. +UPDATE sub_parted set a = 2 WHERE c = 10; + +-- Test update-partition-key, where the unpruned partitions do not have their +-- partition keys updated. +SELECT tableoid::regclass::text, * FROM list_parted WHERE a = 2 ORDER BY 1; +UPDATE list_parted set b = c + a WHERE a = 2; +SELECT tableoid::regclass::text, * FROM list_parted WHERE a = 2 ORDER BY 1; + + +-- Cleanup: list_parted no longer needed. 
+DROP TABLE list_parted; + +-- create custom operator class and hash function, for the same reason +-- explained in alter_table.sql +create or replace function dummy_hashint4(a int4, seed int8) returns int8 as +$$ begin return (a + seed); end; $$ language 'plpgsql' immutable; +create operator class custom_opclass for type int4 using hash as +operator 1 = , function 2 dummy_hashint4(int4, int8); + +create table hash_parted ( + a int, + b int +) partition by hash (a custom_opclass, b custom_opclass); +create table hpart1 partition of hash_parted for values with (modulus 2, remainder 1); +create table hpart2 partition of hash_parted for values with (modulus 4, remainder 2); +create table hpart3 partition of hash_parted for values with (modulus 8, remainder 0); +create table hpart4 partition of hash_parted for values with (modulus 8, remainder 4); +insert into hpart1 values (1, 1); +insert into hpart2 values (2, 5); +insert into hpart4 values (3, 4); + +-- fail +update hpart1 set a = 3, b=4 where a = 1; +-- ok, row movement +update hash_parted set b = b - 1 where b = 1; +-- ok +update hash_parted set b = b + 8 where b = 1; + +-- cleanup +drop table hash_parted; +drop operator class custom_opclass using hash; +drop function dummy_hashint4(a int4, seed int8); diff --git a/contrib/pax_storage/src/data/sql/update_gp.sql b/contrib/pax_storage/sql/update_gp.sql similarity index 78% rename from contrib/pax_storage/src/data/sql/update_gp.sql rename to contrib/pax_storage/sql/update_gp.sql index 3fe87351ac5..30efc73f679 100644 --- a/contrib/pax_storage/src/data/sql/update_gp.sql +++ b/contrib/pax_storage/sql/update_gp.sql @@ -1,9 +1,10 @@ +set default_table_access_method = pax; + -- Test DELETE and UPDATE on an inherited table. -- The special aspect of this table is that the inherited table has -- a different distribution key. 'p' table's distribution key matches -- that of 'r', but 'p2's doesn't. Test that the planner adds a Motion -- node correctly for p2. 
-set default_table_access_method = 'pax'; create table todelete (a int) distributed by (a); create table parent (a int, b int, c int) distributed by (a); create table child (a int, b int, c int) inherits (parent) distributed by (b); @@ -62,9 +63,8 @@ create table base_tbl (a int4, b int4) distributed by (a); create table child_a (a int4, b int4) inherits (base_tbl) distributed by (a); create table child_b (a int4, b int4) inherits (base_tbl) distributed by (b); insert into base_tbl select g, g from generate_series(1, 5) g; --- start_ignore + explain (costs off) update base_tbl set a=a+1; --- end_ignore update base_tbl set a = 5; -- @@ -84,8 +84,8 @@ INSERT INTO keo3 VALUES ('1', '1'); CREATE TABLE keo4 ( keo_para_required_period character varying(6), keo_para_budget_date character varying(24)) DISTRIBUTED RANDOMLY; INSERT INTO keo4 VALUES ('1', '1'); +ANALYZE keo1, keo2, keo3, keo4; -- Explicit Redistribution motion should be added in case of GPDB Planner (test case not applicable for ORCA) --- start_ignore EXPLAIN (COSTS OFF) UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b ON b.projects_pk=a.user_vie_project_code_pk @@ -95,7 +95,6 @@ EXPLAIN (COSTS OFF) UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM (SELECT min (keo4.keo_para_budget_date) FROM keo4))) ) t1 WHERE t1.user_vie_project_code_pk = keo1.user_vie_project_code_pk; --- end_ignore UPDATE keo1 SET user_vie_act_cntr_marg_cum = 234.682 FROM ( SELECT a.user_vie_project_code_pk FROM keo1 a INNER JOIN keo2 b ON b.projects_pk=a.user_vie_project_code_pk @@ -110,9 +109,7 @@ SELECT user_vie_act_cntr_marg_cum FROM keo1; -- Explicit Redistribution motion should not be added in case of GPDB Planner (test case not applicable to ORCA) CREATE TABLE keo5 (x int, y int) DISTRIBUTED BY (x); INSERT INTO keo5 VALUES (1,1); --- start_ignore EXPLAIN (COSTS OFF) DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 
WHERE x < 2)); --- end_ignore DELETE FROM keo5 WHERE x IN (SELECT x FROM keo5 WHERE EXISTS (SELECT x FROM keo5 WHERE x < 2)); SELECT x FROM keo5; @@ -123,54 +120,52 @@ DROP TABLE keo3; DROP TABLE keo4; DROP TABLE keo5; --- start_ignore --- -- text types. We should support the following updates. --- -- +-- +-- text types. We should support the following updates. +-- --- CREATE TEMP TABLE ttab1 (a varchar(15), b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a varchar(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab1 (a varchar(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar(15), b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; +DROP TABLE ttab1; +DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a text, b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a text, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab1 (a text, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a text, b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; +DROP TABLE ttab1; +DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a varchar, b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a varchar, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab1 (a varchar, b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a varchar, b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE ttab1; --- DROP TABLE ttab2; +DROP TABLE ttab1; +DROP TABLE ttab2; --- CREATE TEMP TABLE ttab1 (a char(15), b integer) DISTRIBUTED BY (a); --- CREATE TEMP TABLE ttab2 (a char(15), b integer) DISTRIBUTED BY 
(a); +CREATE TEMP TABLE ttab1 (a char(15), b integer) DISTRIBUTED BY (a); +CREATE TEMP TABLE ttab2 (a char(15), b integer) DISTRIBUTED BY (a); --- UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; +UPDATE ttab1 SET b = ttab2.b FROM ttab2 WHERE ttab1.a = ttab2.a; --- DROP TABLE IF EXISTS update_distr_key; +DROP TABLE IF EXISTS update_distr_key; --- CREATE TEMP TABLE update_distr_key (a int, b int) DISTRIBUTED BY (a); --- INSERT INTO update_distr_key select i, i* 10 from generate_series(0, 9) i; +CREATE TEMP TABLE update_distr_key (a int, b int) DISTRIBUTED BY (a); +INSERT INTO update_distr_key select i, i* 10 from generate_series(0, 9) i; --- UPDATE update_distr_key SET a = 5 WHERE b = 10; +UPDATE update_distr_key SET a = 5 WHERE b = 10; --- SELECT * from update_distr_key; +SELECT * from update_distr_key; --- DROP TABLE update_distr_key; - --- end_ignore +DROP TABLE update_distr_key; -- below cases is to test multi-hash-cols CREATE TABLE tab3(c1 int, c2 int, c3 int, c4 int, c5 int) DISTRIBUTED BY (c1, c2, c3); @@ -202,9 +197,8 @@ UPDATE tab5 set (c1,c2,c3,c4,c5) = (1,2,3,0,6) where c5 = 1; SELECT gp_segment_id, * FROM tab5; UPDATE tab5 set c1 = 11 where c3 = 10 and c3 < 1; SELECT gp_segment_id, * FROM tab5; --- start_ignore + EXPLAIN (COSTS OFF ) UPDATE tab3 SET C1 = C1 + 1, C5 = C5+1; --- end_ignore -- clean up drop table tab3; @@ -260,21 +254,20 @@ select * from r; select * from s; update s set a = s.a + 1 where exists (select 1 from r where s.a = r.b); select * from s; --- start_ignore + -- Update ao table distribution key --- create table update_ao_table (a int, b int) WITH (appendonly=true) distributed by (a); --- insert into update_ao_table select g, g from generate_series(1, 5) g; --- select * from update_ao_table; --- update update_ao_table set a = a + 1 where b = 3; --- select * from update_ao_table; +create table update_ao_table (a int, b int) WITH (appendonly=true) distributed by (a); +insert into update_ao_table select g, g from 
generate_series(1, 5) g; +select * from update_ao_table; +update update_ao_table set a = a + 1 where b = 3; +select * from update_ao_table; -- Update aoco table distribution key --- create table update_aoco_table (a int, b int) WITH (appendonly=true, orientation=column) distributed by (a); --- insert into update_aoco_table select g,g from generate_series(1, 5) g; --- select * from update_aoco_table; --- update update_aoco_table set a = a + 1 where b = 3; --- select * from update_aoco_table; --- end_ignore +create table update_aoco_table (a int, b int) WITH (appendonly=true, orientation=column) distributed by (a); +insert into update_aoco_table select g,g from generate_series(1, 5) g; +select * from update_aoco_table; +update update_aoco_table set a = a + 1 where b = 3; +select * from update_aoco_table; -- Update prepare delete from s; @@ -288,9 +281,7 @@ select * from s; -- Confirm that a split update is not created for a table excluded by -- constraints in the planner. create table nosplitupdate (a int) distributed by (a); --- start_ignore explain update nosplitupdate set a=0 where a=1 and a<1; --- end_ignore -- test split-update when split-node's flow is entry create table tsplit_entry (c int); @@ -298,42 +289,42 @@ insert into tsplit_entry values (1), (2); analyze tsplit_entry; -- start_ignore +-- gp_segment_configuration scan is different when using different FTS explain update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; -- end_ignore update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_configuration) s; --- start_ignore --- CREATE TABLE update_gp_foo ( --- a_dist int, --- b int, --- c_part int, --- d int --- ) --- WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) --- ( --- PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo_1_prt_p20190305', appendonly=false) --- ); - --- CREATE TABLE update_gp_foo1 ( --- a_dist int, --- b int, --- c_part int, --- d int 
--- ) --- WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) --- ( --- PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo1_1_prt_p20190305', appendonly=false) --- ); - --- INSERT INTO update_gp_foo VALUES (12, 40, 1, 50); --- INSERT INTO update_gp_foo1 VALUES (12, 3, 1, 50); - --- UPDATE update_gp_foo --- SET b = update_gp_foo.c_part, --- d = update_gp_foo1.a_dist --- FROM update_gp_foo1; - --- SELECT * from update_gp_foo; --- end_ignore + +CREATE TABLE update_gp_foo ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo_1_prt_p20190305', appendonly=false) + ); + +CREATE TABLE update_gp_foo1 ( + a_dist int, + b int, + c_part int, + d int +) +WITH (appendonly=false) DISTRIBUTED BY (a_dist) PARTITION BY RANGE(c_part) + ( + PARTITION p20190305 START (1) END (2) WITH (tablename='update_gp_foo1_1_prt_p20190305', appendonly=false) + ); + +INSERT INTO update_gp_foo VALUES (12, 40, 1, 50); +INSERT INTO update_gp_foo1 VALUES (12, 3, 1, 50); + +UPDATE update_gp_foo +SET b = update_gp_foo.c_part, + d = update_gp_foo1.a_dist +FROM update_gp_foo1; + +SELECT * from update_gp_foo; -- Test insert on conflict do update -- Insert on conflict do update is an insert statement but might @@ -342,7 +333,6 @@ update tsplit_entry set c = s.a from (select count(*) as a from gp_segment_confi -- planning, if a `insert on conflict do update` statement set the -- dist keys of the table, it will raise an error. 
-- See github issue: https://github.com/greenplum-db/gpdb/issues/9444 --- start_ignore create table t_insert_on_conflict_update_distkey(a int, b int) distributed by (a); create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); @@ -358,7 +348,6 @@ create table t_insert_on_conflict_update_distkey(a int, b int) distributed repli create unique index uidx_t_insert_on_conflict_update_distkey on t_insert_on_conflict_update_distkey(a, b); -- the following statement should succeed because replicated table does not contain distkey insert into t_insert_on_conflict_update_distkey values (1, 1) on conflict(a, b) do update set a = 1; --- end_ignore -- Some tests on a partitioned table. CREATE TABLE update_gp_rangep (a int, b int, orig_a int) DISTRIBUTED BY (b) PARTITION BY RANGE (a); @@ -379,9 +368,8 @@ UPDATE update_gp_rangep SET a = 10 WHERE a = 3; -- Move row to different partition and also change distribution key UPDATE update_gp_rangep SET a = 11, b = 1 WHERE a = 4; --- start_ignore + SELECT tableoid::regclass, * FROM update_gp_rangep ORDER BY orig_a; --- end_ignore -- Also do a lookup with specific distribution key. If the rows were not -- correctly moved across segments, this would fail to find them, assuming -- that direct dispatch is effective. 
diff --git a/contrib/pax_storage/src/cpp/CMakeLists.txt b/contrib/pax_storage/src/cpp/CMakeLists.txt index 8ac5f846c7a..8b6cbe0fd29 100644 --- a/contrib/pax_storage/src/cpp/CMakeLists.txt +++ b/contrib/pax_storage/src/cpp/CMakeLists.txt @@ -1,242 +1,37 @@ cmake_minimum_required (VERSION 3.11.0) # protobuf -include(ExternalProject) -option(ORC_PREFER_STATIC_PROTOBUF "Prefer static protobuf library, if available" ON) -set(THIRDPARTY_CONFIGURE_COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}") -set(THIRDPARTY_DIR "${CMAKE_BINARY_DIR}/src/cpp/contrib") -set(THIRDPARTY_LOG_OPTIONS LOG_CONFIGURE 1 - LOG_BUILD 1 - LOG_INSTALL 1 - LOG_DOWNLOAD 1) -set(PROTOBUF_PREFIX "${THIRDPARTY_DIR}/protobuf_ep-install") -set(PROTOBUF_INCLUDE_DIR "${PROTOBUF_PREFIX}/include") -set(PROTOBUF_CMAKE_ARGS -DCMAKE_INSTALL_PREFIX=${PROTOBUF_PREFIX} - -DCMAKE_INSTALL_LIBDIR=lib - -DBUILD_SHARED_LIBS=OFF - -Dprotobuf_BUILD_TESTS=OFF) - -set(PROTOBUF_CMAKE_ARGS ${PROTOBUF_CMAKE_ARGS} -DCMAKE_POSITION_INDEPENDENT_CODE=ON) -set(PROTOBUF_STATIC_LIB_PREFIX ${CMAKE_STATIC_LIBRARY_PREFIX}) -set(PROTOBUF_STATIC_LIB "${PROTOBUF_PREFIX}/lib/${PROTOBUF_STATIC_LIB_PREFIX}protobuf${CMAKE_STATIC_LIBRARY_SUFFIX}") -message(STATUS "${PROTOBUF_STATIC_LIB}") -set(PROTOC_STATIC_LIB "${PROTOBUF_PREFIX}/lib/${PROTOBUF_STATIC_LIB_PREFIX}protoc${CMAKE_STATIC_LIBRARY_SUFFIX}") -set(PROTOBUF_EXECUTABLE "${PROTOBUF_PREFIX}/bin/protoc${CMAKE_EXECUTABLE_SUFFIX}") - -set(PROTOBUF_CONFIGURE CONFIGURE_COMMAND "${THIRDPARTY_CONFIGURE_COMMAND}" ${PROTOBUF_CMAKE_ARGS} - "${CMAKE_CURRENT_BINARY_DIR}/protobuf_ep-prefix/src/protobuf_ep/cmake") - -ExternalProject_Add(protobuf_ep - URL "https://artifactory.hashdata.xyz/artifactory/utility/protobuf-3.6.1.tar.gz" - ${PROTOBUF_CONFIGURE} - ${THIRDPARTY_LOG_OPTIONS} - BUILD_BYPRODUCTS "${PROTOBUF_STATIC_LIB}" "${PROTOC_STATIC_LIB}") - -set(PROTOBUF_LIBRARY ${PROTOBUF_STATIC_LIB}) -set(PROTOC_LIBRARY ${PROTOC_STATIC_LIB}) -set(PROTOBUF_VENDORED ON) -set(INSTALL_VENDORED_LIBS OFF) - 
-add_library (orc_protobuf INTERFACE) -add_library (orc::protobuf ALIAS orc_protobuf) -add_library (orc_protoc INTERFACE) -add_library (orc::protoc ALIAS orc_protoc) - -if (ORC_PREFER_STATIC_PROTOBUF AND ${PROTOBUF_STATIC_LIB}) - target_link_libraries (orc_protobuf INTERFACE ${PROTOBUF_STATIC_LIB}) -else () - target_link_libraries (orc_protobuf INTERFACE ${PROTOBUF_LIBRARY}) -endif() - -target_include_directories (orc_protobuf SYSTEM INTERFACE ${PROTOBUF_INCLUDE_DIR}) - -if (ORC_PREFER_STATIC_PROTOBUF AND ${PROTOC_STATIC_LIB}) - target_link_libraries (orc_protoc INTERFACE ${PROTOC_STATIC_LIB}) -else () - target_link_libraries (orc_protoc INTERFACE ${PROTOC_LIBRARY}) -endif() - -target_include_directories (orc_protoc SYSTEM INTERFACE ${PROTOBUF_INCLUDE_DIR}) - -if (PROTOBUF_VENDORED) - add_dependencies (orc_protoc protobuf_ep) - add_dependencies (orc_protobuf protobuf_ep) - if (INSTALL_VENDORED_LIBS) - install(FILES "${PROTOBUF_STATIC_LIB}" "${PROTOC_STATIC_LIB}" - DESTINATION "lib") - endif () -endif () - -set(orc_proto_file "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/orc_proto.proto") -set(orc_proto_src "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/orc_proto.pb.h" "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/orc_proto.pb.cc") - -set(pax_proto_file "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/pax.proto") -set(pax_proto_src "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/pax.pb.h" "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/pax.pb.cc") - -set(catalog_proto_file "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/micro_partition_stats.proto") -set(stats_proto_src "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/micro_partition_stats.pb.h" "${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/micro_partition_stats.pb.cc") - -add_custom_command(OUTPUT ${orc_proto_src} - COMMAND ${PROTOBUF_EXECUTABLE} - -I ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/ - --cpp_out="${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/" - ${orc_proto_file}) - -add_custom_command(OUTPUT ${pax_proto_src} - COMMAND ${PROTOBUF_EXECUTABLE} - -I 
${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/ - --cpp_out="${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/" - ${pax_proto_file}) - -add_custom_command(OUTPUT ${stats_proto_src} - COMMAND ${PROTOBUF_EXECUTABLE} - -I ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/ - --cpp_out="${CMAKE_CURRENT_SOURCE_DIR}/storage/proto" - ${catalog_proto_file}) - -add_custom_target(generate_protobuf DEPENDS ${orc_proto_src} ${pax_proto_src} ${stats_proto_src}) - -if (BUILD_GTEST AND NOT BUILD_PAX_FORMAT) - add_subdirectory(contrib/googletest) - ADD_DEFINITIONS(-DRUN_GTEST) - file(GLOB TEST_CASE_SOURCES - ${CMAKE_CURRENT_SOURCE_DIR}/*/*_test.cc - ${CMAKE_CURRENT_SOURCE_DIR}/*/*/*_test.cc) - - link_directories($ENV{GPHOME}/lib) - add_executable(test_main ${TEST_CASE_SOURCES}) - add_dependencies(test_main gtest gmock gtest_main) - target_include_directories(test_main PUBLIC ${CMAKE_CURRENT_SOURCE_DIR} ${gtest_SOURCE_DIR}/include) - target_link_libraries(test_main gtest gmock gtest_main postgres pax) -endif(BUILD_GTEST AND NOT BUILD_PAX_FORMAT) - -# ztsd -set(ZSTD_BUILD_PROGRAMS OFF) -set(ZSTD_BUILD_TESTS OFF) -set(ZSTD_BUILD_CONTRIB) -add_subdirectory(contrib/zstd/build/cmake/) -set(ZTSD_HEADER contrib/zstd/lib) - -set(pax_comm_src - comm/bitmap.cc - comm/paxc_wrappers.cc - comm/cbdb_wrappers.cc) - -set(pax_exceptions_src - exceptions/CException.cc) - -set(pax_storage_src - storage/columns/pax_column.cc - storage/columns/pax_column_int.cc - storage/columns/pax_compress.cc - storage/columns/pax_columns.cc - storage/columns/pax_encoding_utils.cc - storage/columns/pax_encoding_non_fixed_column.cc - storage/columns/pax_encoding_column.cc - storage/columns/pax_decoding.cc - storage/columns/pax_encoding.cc - storage/columns/pax_rlev2_decoding.cc - storage/columns/pax_rlev2_encoding.cc - storage/file_system.cc - storage/pax_filter.cc - storage/local_file_system.cc - storage/micro_partition.cc - storage/micro_partition_file_factory.cc - storage/micro_partition_iterator.cc - 
storage/micro_partition_metadata.cc - storage/pax_buffer.cc - storage/proto/protobuf_stream.cc - storage/pax_filter.cc - storage/strategy.cc - storage/paxc_block_map_manager.cc - storage/orc/orc.cc - storage/strategy.cc) - -if(NOT BUILD_PAX_FORMAT) - set(pax_storage_src ${pax_storage_src} storage/pax.cc) -endif(NOT BUILD_PAX_FORMAT) - -set(pax_access_src - access/pax_access_handle.cc - access/pax_deleter.cc - access/pax_dml_state.cc - access/pax_inserter.cc - access/pax_updater.cc - access/pax_scanner.cc) - -set(pax_catalog_src - catalog/micro_partition_stats.cc - catalog/pax_aux_table.cc) - -set(pax_vec_src - storage/vec/pax_vec_adapter.cc - storage/vec/pax_vec_reader.cc) - -link_directories($ENV{GPHOME}/lib) - -if(BUILD_PAX_FORMAT) - # paxformat.so - ADD_DEFINITIONS(-DBUILD_PAX_FORMAT) - add_library(paxformat SHARED ${orc_proto_src} ${pax_proto_src} ${pax_storage_src} ${pax_exceptions_src} ${pax_comm_src} ) - target_include_directories(paxformat PUBLIC ${ZTSD_HEADER} ${CMAKE_CURRENT_SOURCE_DIR} ${CBDB_INCLUDE_DIR}) - target_link_libraries(paxformat PUBLIC uuid orc_protobuf zstd z) - set_target_properties(paxformat PROPERTIES - OUTPUT_NAME paxformat) - add_dependencies(paxformat generate_protobuf) - - # export headers - set(PAX_COMM_HEADERS - comm/cbdb_api.h - ) - - ## install dynamic libraray - install(TARGETS paxformat - LIBRARY DESTINATION ${CMAKE_INSTALL_PREFIX}/lib) - - # TODO(gongxun): - # We should explicitly specify the headers - # that need to be exported, and use the syntax of - # install(FILES,...) 
to install the header files - install(DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/storage - DESTINATION ${CMAKE_INSTALL_PREFIX}/include/pax - FILES_MATCHING - PATTERN "*.h" -) - -install(FILES ${PAX_COMM_HEADERS} - DESTINATION ${CMAKE_INSTALL_PREFIX}/include/pax/comm +set(protobuf_files + ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/micro_partition_stats.proto + ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/pax.proto + ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto/orc_proto.proto ) -else() - add_library(pax SHARED ${orc_proto_src} ${pax_proto_src} ${pax_storage_src} ${stats_proto_src} ${pax_exceptions_src} - ${pax_access_src} ${pax_comm_src} ${pax_catalog_src} ${pax_vec_src}) - set_target_properties(pax PROPERTIES OUTPUT_NAME pax) - target_include_directories(pax PUBLIC ${ZTSD_HEADER} ${CMAKE_CURRENT_SOURCE_DIR} ${CBDB_INCLUDE_DIR}) - target_link_libraries(pax PUBLIC uuid orc_protobuf zstd z postgres) - add_dependencies(pax generate_protobuf) - add_custom_command(TARGET pax POST_BUILD - COMMAND ${CMAKE_COMMAND} -E - copy_if_different $ ${CMAKE_CURRENT_SOURCE_DIR}/../data/pax.so) -endif(BUILD_PAX_FORMAT) +set(PROTO_DIR ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto) +set(PROTO_OUTPUT_DIR ${CMAKE_CURRENT_SOURCE_DIR}/storage/proto) -# vec build -if (VEC_BUILD) - set(VEC_HEADER ${VEC_HOME}/src/include/) +## we generate these files in the cmake -B build phase. +## when we start the make phase, all dependent files exist, and we can compile with multiple threads. 
+FOREACH(FIL ${protobuf_files}) + GET_FILENAME_COMPONENT(FIL_WE ${FIL} NAME_WE) + string(REGEX REPLACE ".+/(.+)\\..*" "\\1" FILE_NAME ${FIL}) + string(REGEX REPLACE "(.+)\\${FILE_NAME}.*" "\\1" FILE_PATH ${FIL}) - find_package(PkgConfig REQUIRED) - pkg_check_modules(GLIB REQUIRED glib-2.0) + set(PROTO_SRCS ${PROTO_SRCS} "${PROTO_OUTPUT_DIR}/${FIL_WE}.pb.cc") + set(PROTO_HDRS ${PROTO_SRCS} "${PROTO_OUTPUT_DIR}/${FIL_WE}.pb.h") - target_include_directories(pax PRIVATE - ${VEC_HEADER} # for utils/tuptable_vec.h - ${CBDB_ROOT_INCLUDE_DIR} # for arrow-glib/arrow-glib.h and otehr arrow interface - ${GLIB_INCLUDE_DIRS} # for glib-object.h - ) + EXECUTE_PROCESS( + COMMAND ${PROTOBUF_PROTOC_EXECUTABLE} -I ${PROTO_DIR} --cpp_out=${PROTO_OUTPUT_DIR} ${FIL} + ) +ENDFOREACH() +add_custom_target(generate_protobuf DEPENDS ${PROTO_SRCS} ${PROTO_HDRS}) - if(BUILD_GTEST) - target_include_directories(test_main PRIVATE ${VEC_HEADER} ${CBDB_ROOT_INCLUDE_DIR} ${GLIB_INCLUDE_DIRS}) - endif(BUILD_GTEST) +link_directories($ENV{GPHOME}/lib) - target_link_libraries(pax PRIVATE arrow) -endif(VEC_BUILD) +list(APPEND CMAKE_MODULE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/cmake") +## build pax_format.so +include(pax_format) +## build pax.so +include(pax) diff --git a/contrib/pax_storage/src/cpp/access/pax_access_handle.cc b/contrib/pax_storage/src/cpp/access/pax_access_handle.cc index be34ff3aecc..a6bc4ab74be 100644 --- a/contrib/pax_storage/src/cpp/access/pax_access_handle.cc +++ b/contrib/pax_storage/src/cpp/access/pax_access_handle.cc @@ -3,11 +3,18 @@ #include "comm/cbdb_api.h" #include "access/pax_dml_state.h" +#include "access/pax_partition.h" #include "access/pax_scanner.h" #include "access/pax_updater.h" +#include "access/paxc_rel_options.h" +#include "access/paxc_scanner.h" #include "catalog/pax_aux_table.h" +#include "catalog/pax_fastsequence.h" +#include "catalog/pg_pax_tables.h" +#include "comm/guc.h" +#include "comm/pax_memory.h" #include "exceptions/CException.h" -#include 
"storage/paxc_block_map_manager.h" +#include "storage/local_file_system.h" #define NOT_IMPLEMENTED_YET \ ereport(ERROR, \ @@ -18,14 +25,8 @@ ereport(ERROR, (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), \ errmsg("not supported on pax relations: %s", __func__))) -#define PAX_DEFAULT_COMPRESSLEVEL AO_DEFAULT_COMPRESSLEVEL -#define PAX_MIN_COMPRESSLEVEL AO_MIN_COMPRESSLEVEL -#define PAX_MAX_COMPRESSLEVEL AO_MAX_COMPRESSLEVEL - -#define PAX_DEFAULT_COMPRESSTYPE AO_DEFAULT_COMPRESSTYPE - #define RELATION_IS_PAX(rel) \ - (OidIsValid((rel)->rd_rel->relam) && AMOidIsPax((rel)->rd_rel->relam)) + (OidIsValid((rel)->rd_rel->relam) && RelationIsPAX(rel)) // CBDB_TRY(); // { @@ -41,6 +42,7 @@ // // CBDB_CATCH_MATCH() is optional and can have several match pattern. +char *global_pg_error_message = nullptr; cbdb::CException global_exception(cbdb::CException::kExTypeInvalid); // being of a try block w/o explicit handler @@ -63,6 +65,7 @@ cbdb::CException global_exception(cbdb::CException::kExTypeInvalid); catch (cbdb::CException & e) { \ internal_cbdb_try_throw_error_ = true; \ internal_cbdb_try_throw_error_with_stack_ = true; \ + global_pg_error_message = elog_message(); \ elog(LOG, "\npax stack trace: \n%s", e.Stack()); \ global_exception = e; \ } \ @@ -79,44 +82,29 @@ cbdb::CException global_exception(cbdb::CException::kExTypeInvalid); } while (0); // end of a try-catch block -#define CBDB_END_TRY() \ - } \ - if (internal_cbdb_try_throw_error_) { \ - if (internal_cbdb_try_throw_error_with_stack_) { \ - elog(LOG, "\npax stack trace: \n%s", global_exception.Stack()); \ - ereport(ERROR, errmsg("%s", global_exception.What().c_str())); \ - } \ - if (error_message.Length() == 0) \ - error_message.Append("ERROR: %s", __func__); \ - ereport(ERROR, errmsg("%s", error_message.Message())); \ - } \ - } \ +#define CBDB_END_TRY() \ + } \ + if (internal_cbdb_try_throw_error_) { \ + if (global_pg_error_message) { \ + elog(LOG, "\npg error message:%s", global_pg_error_message); \ + } \ + if 
(internal_cbdb_try_throw_error_with_stack_) { \ + elog(LOG, "\npax stack trace: \n%s", global_exception.Stack()); \ + ereport( \ + ERROR, \ + errmsg("%s (PG message: %s)", global_exception.What().c_str(), \ + !global_pg_error_message ? "" : global_pg_error_message)); \ + } \ + if (error_message.Length() == 0) \ + error_message.Append("ERROR: %s", __func__); \ + ereport(ERROR, errmsg("%s", error_message.Message())); \ + } \ + } \ while (0) -bool AMOidIsPax(Oid am_oid) { - HeapTuple tuple; - Form_pg_am form; - bool is_pax; - - tuple = SearchSysCache1(AMOID, ObjectIdGetDatum(am_oid)); - if (!HeapTupleIsValid(tuple)) - elog(ERROR, "cache lookup failed for pg_am.oid = %u", am_oid); - - form = (Form_pg_am)GETSTRUCT(tuple); - is_pax = strcmp(NameStr(form->amname), "pax") == 0; - ReleaseSysCache(tuple); - - return is_pax; -} - -// reloptions structure and variables. -static relopt_kind self_relopt_kind; -static const relopt_parse_elt kSelfReloptTab[] = { - {"compresslevel", RELOPT_TYPE_INT, offsetof(PaxOptions, compress_level)}, - {"compresstype", RELOPT_TYPE_STRING, offsetof(PaxOptions, compress_type)}, - {"storage_format", RELOPT_TYPE_STRING, - offsetof(PaxOptions, storage_format)}, -}; +#define PAX_SCAN_REUSE_BUFFER_DEFAULT_SIZE 8 * 1024 * 1024 +#define PAX_SCAN_REUSE_BUFFER_MIN_SIZE 1 * 1024 * 1024 +#define PAX_SCAN_REUSE_BUFFER_MAX_SIZE 32 * 1024 * 1024 // access methods that are implemented in C++ namespace pax { @@ -128,7 +116,7 @@ TableScanDesc CCPaxAccessMethod::ScanBegin(Relation relation, Snapshot snapshot, CBDB_TRY(); { return PaxScanDesc::BeginScan(relation, snapshot, nkeys, key, pscan, flags, - nullptr); + nullptr, true); } CBDB_CATCH_DEFAULT(); CBDB_END_TRY(); @@ -138,21 +126,22 @@ TableScanDesc CCPaxAccessMethod::ScanBegin(Relation relation, Snapshot snapshot, void CCPaxAccessMethod::ScanEnd(TableScanDesc scan) { CBDB_TRY(); - { PaxScanDesc::EndScan(scan); } + { + auto desc = PaxScanDesc::ToDesc(scan); + desc->EndScan(); + } CBDB_CATCH_DEFAULT(); - 
CBDB_FINALLY({ - // FIXME: destroy PaxScanDesc? - }); + CBDB_FINALLY({}); CBDB_END_TRY(); } TableScanDesc CCPaxAccessMethod::ScanExtractColumns( - Relation rel, Snapshot snapshot, ParallelTableScanDesc parallel_scan, - List *targetlist, List *qual, uint32 flags) { + Relation rel, Snapshot snapshot, int nkeys, struct ScanKeyData *key, + ParallelTableScanDesc parallel_scan, struct PlanState *ps, uint32 flags) { CBDB_TRY(); { - return pax::PaxScanDesc::BeginScanExtractColumns( - rel, snapshot, parallel_scan, targetlist, qual, flags); + return pax::PaxScanDesc::BeginScanExtractColumns(rel, snapshot, nkeys, key, + parallel_scan, ps, flags); } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); @@ -160,16 +149,107 @@ TableScanDesc CCPaxAccessMethod::ScanExtractColumns( pg_unreachable(); } +struct IndexFetchTableData *CCPaxAccessMethod::IndexFetchBegin(Relation rel) { + CBDB_TRY(); + { + auto desc = PAX_NEW(rel); + return desc->ToBase(); + } + CBDB_CATCH_DEFAULT(); + CBDB_FINALLY({}); + CBDB_END_TRY(); + return nullptr; // keep compiler quiet +} + +void CCPaxAccessMethod::IndexFetchEnd(IndexFetchTableData *scan) { + CBDB_TRY(); + { + auto desc = PaxIndexScanDesc::FromBase(scan); + PAX_DELETE(desc); + } + CBDB_CATCH_DEFAULT(); + CBDB_FINALLY({}); + CBDB_END_TRY(); +} + +bool CCPaxAccessMethod::IndexFetchTuple(struct IndexFetchTableData *scan, + ItemPointer tid, Snapshot snapshot, + TupleTableSlot *slot, bool *call_again, + bool *all_dead) { + CBDB_TRY(); + { + auto desc = PaxIndexScanDesc::FromBase(scan); + return desc->FetchTuple(tid, snapshot, slot, call_again, all_dead); + } + CBDB_CATCH_DEFAULT(); + CBDB_FINALLY({}); + CBDB_END_TRY(); + return false; // keep compiler quiet +} + +void CCPaxAccessMethod::IndexFetchReset(IndexFetchTableData * /*scan*/) {} + void CCPaxAccessMethod::RelationSetNewFilenode(Relation rel, const RelFileNode *newrnode, char persistence, TransactionId *freeze_xid, MultiXactId *minmulti) { + Relation pax_tables_rel; + ScanKeyData scan_key[1]; + SysScanDesc 
scan; + HeapTuple tuple; + Oid pax_relid; + bool exists; + + *freeze_xid = *minmulti = InvalidTransactionId; + + pax_tables_rel = table_open(PAX_TABLES_RELATION_ID, RowExclusiveLock); + pax_relid = RelationGetRelid(rel); + + ScanKeyInit(&scan_key[0], ANUM_PG_PAX_TABLES_RELID, BTEqualStrategyNumber, + F_OIDEQ, ObjectIdGetDatum(pax_relid)); + scan = systable_beginscan(pax_tables_rel, PAX_TABLES_RELID_INDEX_ID, true, + NULL, 1, scan_key); + tuple = systable_getnext(scan); + exists = HeapTupleIsValid(tuple); + if (exists) { + Oid aux_relid; + + // set new filenode, not create new table + // + // 1. truncate aux table by new relfilenode + aux_relid = ::paxc::GetPaxAuxRelid(pax_relid); + Assert(OidIsValid(aux_relid)); + paxc::PaxAuxRelationSetNewFilenode(aux_relid); + } else { + // create new table + // + // 1. create aux table + // 2. initialize fast sequence in pg_pax_fastsequence + // 3. setup dependency + paxc::CPaxCreateMicroPartitionTable(rel); + } + + // initialize or reset the fast sequence number + paxc::CPaxInitializeFastSequenceEntry( + pax_relid, + exists ? 
FASTSEQUENCE_INIT_TYPE_UPDATE : FASTSEQUENCE_INIT_TYPE_CREATE); + + systable_endscan(scan); + table_close(pax_tables_rel, NoLock); + + // create relfilenode file for pax table + auto srel = RelationCreateStorage(*newrnode, persistence, SMGR_MD, rel); + smgrclose(srel); + + // create data directory CBDB_TRY(); { - *freeze_xid = *minmulti = InvalidTransactionId; - pax::CCPaxAuxTable::PaxAuxRelationSetNewFilenode(rel, newrnode, - persistence); + FileSystem *fs = pax::Singleton::GetInstance(); + auto path = cbdb::BuildPaxDirectoryPath(*newrnode, rel->rd_backend); + Assert(!path.empty()); + CBDB_CHECK((fs->CreateDirectory(path) == 0), + cbdb::CException::ExType::kExTypeIOError); } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); @@ -233,12 +313,14 @@ void CCPaxAccessMethod::RelationFileUnlink(RelFileNodeBackend rnode) { CBDB_END_TRY(); } -void CCPaxAccessMethod::ScanRescan(TableScanDesc scan, ScanKey /*key*/, - bool /*set_params*/, bool /*allow_strat*/, - bool /*allow_sync*/, - bool /*allow_pagemode*/) { +void CCPaxAccessMethod::ScanRescan(TableScanDesc scan, ScanKey key, + bool set_params, bool allow_strat, + bool allow_sync, bool allow_pagemode) { CBDB_TRY(); - { pax::PaxScanDesc::ReScan(scan); } + { + auto desc = PaxScanDesc::ToDesc(scan); + desc->ReScan(key, set_params, allow_strat, allow_sync, allow_pagemode); + } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); CBDB_END_TRY(); @@ -248,11 +330,12 @@ bool CCPaxAccessMethod::ScanGetNextSlot(TableScanDesc scan, ScanDirection /*direction*/, TupleTableSlot *slot) { CBDB_TRY(); - { return PaxScanDesc::ScanGetNextSlot(scan, slot); } + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->GetNextSlot(slot); + } CBDB_CATCH_DEFAULT(); - CBDB_FINALLY({ - // FIXME: destroy PaxScanDesc? 
- }); + CBDB_FINALLY({}); CBDB_END_TRY(); pg_unreachable(); @@ -315,11 +398,14 @@ TM_Result CCPaxAccessMethod::TupleUpdate(Relation relation, ItemPointer otid, pg_unreachable(); } -bool CCPaxAccessMethod::ScanAnalyzeNextBlock( - TableScanDesc scan, BlockNumber blockno, - BufferAccessStrategy /*bstrategy*/) { +bool CCPaxAccessMethod::ScanAnalyzeNextBlock(TableScanDesc scan, + BlockNumber blockno, + BufferAccessStrategy bstrategy) { CBDB_TRY(); - { return PaxScanDesc::ScanAnalyzeNextBlock(scan, blockno); } + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->ScanAnalyzeNextBlock(blockno, bstrategy); + } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); CBDB_END_TRY(); @@ -327,34 +413,54 @@ bool CCPaxAccessMethod::ScanAnalyzeNextBlock( } bool CCPaxAccessMethod::ScanAnalyzeNextTuple(TableScanDesc scan, - TransactionId /*oldest_xmin*/, + TransactionId oldest_xmin, double *liverows, double *deadrows, TupleTableSlot *slot) { CBDB_TRY(); - { return PaxScanDesc::ScanAnalyzeNextTuple(scan, liverows, deadrows, slot); } + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->ScanAnalyzeNextTuple(oldest_xmin, liverows, deadrows, slot); + } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); CBDB_END_TRY(); pg_unreachable(); } -bool CCPaxAccessMethod::ScanBitmapNextBlock(TableScanDesc /*scan*/, - TBMIterateResult * /*tbmres*/) { - NOT_IMPLEMENTED_YET; - return false; +bool CCPaxAccessMethod::ScanBitmapNextBlock(TableScanDesc scan, + TBMIterateResult *tbmres) { + CBDB_TRY(); + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->BitmapNextBlock(tbmres); + } + CBDB_CATCH_DEFAULT(); + CBDB_FINALLY({}); + CBDB_END_TRY(); + pg_unreachable(); } -bool CCPaxAccessMethod::ScanBitmapNextTuple(TableScanDesc /*scan*/, - TBMIterateResult * /*tbmres*/, - TupleTableSlot * /*slot*/) { - NOT_IMPLEMENTED_YET; - return false; +bool CCPaxAccessMethod::ScanBitmapNextTuple(TableScanDesc scan, + TBMIterateResult *tbmres, + TupleTableSlot *slot) { + CBDB_TRY(); + { + auto desc = PaxScanDesc::ToDesc(scan); + 
return desc->BitmapNextTuple(tbmres, slot); + } + CBDB_CATCH_DEFAULT(); + CBDB_FINALLY({}); + CBDB_END_TRY(); + pg_unreachable(); } bool CCPaxAccessMethod::ScanSampleNextBlock(TableScanDesc scan, SampleScanState *scanstate) { CBDB_TRY(); - { return PaxScanDesc::ScanSampleNextBlock(scan, scanstate); } + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->ScanSampleNextBlock(scanstate); + } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); CBDB_END_TRY(); @@ -362,10 +468,13 @@ bool CCPaxAccessMethod::ScanSampleNextBlock(TableScanDesc scan, } bool CCPaxAccessMethod::ScanSampleNextTuple(TableScanDesc scan, - SampleScanState * /*scanstate*/, + SampleScanState *scanstate, TupleTableSlot *slot) { CBDB_TRY(); - { return PaxScanDesc::ScanSampleNextTuple(scan, slot); } + { + auto desc = PaxScanDesc::ToDesc(scan); + return desc->ScanSampleNextTuple(scanstate, slot); + } CBDB_CATCH_DEFAULT(); CBDB_FINALLY({}); CBDB_END_TRY(); @@ -409,9 +518,7 @@ void CCPaxAccessMethod::FinishBulkInsert(Relation relation, int options) { } void CCPaxAccessMethod::ExtDmlInit(Relation rel, CmdType operation) { - if (!RELATION_IS_PAX(rel)) { - return; - } + if (!RELATION_IS_PAX(rel)) return; CBDB_TRY(); { pax::CPaxDmlStateLocal::Instance()->InitDmlState(rel, operation); } @@ -421,9 +528,7 @@ void CCPaxAccessMethod::ExtDmlInit(Relation rel, CmdType operation) { } void CCPaxAccessMethod::ExtDmlFini(Relation rel, CmdType operation) { - if (!RELATION_IS_PAX(rel)) { - return; - } + if (!RELATION_IS_PAX(rel)) return; CBDB_TRY(); { pax::CPaxDmlStateLocal::Instance()->FinishDmlState(rel, operation); } @@ -458,29 +563,6 @@ void PaxAccessMethod::ParallelscanReinitialize( NOT_IMPLEMENTED_YET; } -struct IndexFetchTableData *PaxAccessMethod::IndexFetchBegin(Relation /*rel*/) { - NOT_SUPPORTED_YET; - return nullptr; -} - -void PaxAccessMethod::IndexFetchEnd(IndexFetchTableData * /*data*/) { - NOT_SUPPORTED_YET; -} - -void PaxAccessMethod::IndexFetchReset(IndexFetchTableData * /*data*/) { - NOT_SUPPORTED_YET; -} - 
-bool PaxAccessMethod::IndexFetchTuple(struct IndexFetchTableData * /*scan*/, - ItemPointer /*tid*/, - Snapshot /*snapshot*/, - TupleTableSlot * /*slot*/, - bool * /*call_again*/, - bool * /*all_dead*/) { - NOT_SUPPORTED_YET; - return false; -} - void PaxAccessMethod::TupleInsertSpeculative(Relation /*relation*/, TupleTableSlot * /*slot*/, CommandId /*cid*/, int /*options*/, @@ -556,10 +638,10 @@ uint64 PaxAccessMethod::RelationSize(Relation rel, ForkNumber fork_number) { if (fork_number != MAIN_FORKNUM) return 0; // Get the oid of pg_pax_blocks_xxx from pg_pax_tables - GetPaxTablesEntryAttributes(rel->rd_id, &pax_aux_oid, NULL, NULL); + pax_aux_oid = ::paxc::GetPaxAuxRelid(rel->rd_id); // Scan pg_pax_blocks_xxx to calculate size of micro partition - pax_aux_rel = heap_open(pax_aux_oid, AccessShareLock); + pax_aux_rel = table_open(pax_aux_oid, AccessShareLock); aux_tup_desc = RelationGetDescr(pax_aux_rel); aux_scan = systable_beginscan(pax_aux_rel, InvalidOid, false, NULL, 0, NULL); @@ -576,7 +658,7 @@ uint64 PaxAccessMethod::RelationSize(Relation rel, ForkNumber fork_number) { } systable_endscan(aux_scan); - heap_close(pax_aux_rel, AccessShareLock); + table_close(pax_aux_rel, AccessShareLock); return pax_size; } @@ -599,7 +681,7 @@ void PaxAccessMethod::EstimateRelSize(Relation rel, int32 * /*attr_widths*/, TupleDesc aux_tup_desc; HeapTuple aux_tup; SysScanDesc aux_scan; - uint32 total_tuples = 0; + uint64 total_tuples = 0; uint64 pax_size = 0; // Even an empty table takes at least one page, @@ -610,10 +692,10 @@ void PaxAccessMethod::EstimateRelSize(Relation rel, int32 * /*attr_widths*/, *allvisfrac = 0; // Get the oid of pg_pax_blocks_xxx from pg_pax_tables - GetPaxTablesEntryAttributes(rel->rd_id, &pax_aux_oid, NULL, NULL); + pax_aux_oid = ::paxc::GetPaxAuxRelid(rel->rd_id); // Scan pg_pax_blocks_xxx to get attributes - pax_aux_rel = heap_open(pax_aux_oid, AccessShareLock); + pax_aux_rel = table_open(pax_aux_oid, AccessShareLock); aux_tup_desc = 
RelationGetDescr(pax_aux_rel); aux_scan = systable_beginscan(pax_aux_rel, InvalidOid, false, NULL, 0, NULL); @@ -640,20 +722,122 @@ void PaxAccessMethod::EstimateRelSize(Relation rel, int32 * /*attr_widths*/, } systable_endscan(aux_scan); - heap_close(pax_aux_rel, AccessShareLock); + table_close(pax_aux_rel, AccessShareLock); *tuples = static_cast(total_tuples); *pages = RelationGuessNumberOfBlocksFromSize(pax_size); } double PaxAccessMethod::IndexBuildRangeScan( - Relation /*heap_relation*/, Relation /*index_relation*/, - IndexInfo * /*index_info*/, bool /*allow_sync*/, bool /*anyvisible*/, - bool /*progress*/, BlockNumber /*start_blockno*/, BlockNumber /*numblocks*/, - IndexBuildCallback /*callback*/, void * /*callback_state*/, - TableScanDesc /*scan*/) { - NOT_SUPPORTED_YET; - return 0.0; + Relation heap_relation, Relation index_relation, IndexInfo *index_info, + bool /*allow_sync*/, bool anyvisible, bool progress, + BlockNumber start_blockno, BlockNumber numblocks, + IndexBuildCallback callback, void *callback_state, TableScanDesc scan) { + Datum values[INDEX_MAX_KEYS]; + bool isnull[INDEX_MAX_KEYS]; + double reltuples = 0; + ExprState *predicate; + TupleTableSlot *slot; + EState *estate; + ExprContext *econtext; + Snapshot snapshot; + + bool checking_uniqueness; + bool need_unregister_snapshot; + BlockNumber previous_blkno = InvalidBlockNumber; + + Assert(OidIsValid(index_relation->rd_rel->relam)); + Assert(!IsSystemRelation(heap_relation)); + + checking_uniqueness = + (index_info->ii_Unique || index_info->ii_ExclusionOps != NULL); + // "Any visible" mode is not compatible with uniqueness checks; make sure + // only one of those is requested. 
+ (void)anyvisible; // keep compiler quiet for release version + Assert(!(anyvisible && checking_uniqueness)); + + slot = table_slot_create(heap_relation, NULL); + estate = CreateExecutorState(); + econtext = GetPerTupleExprContext(estate); + econtext->ecxt_scantuple = slot; + predicate = ExecPrepareQual(index_info->ii_Predicate, estate); + + if (!scan) { + snapshot = RegisterSnapshot(GetTransactionSnapshot()); + scan = table_beginscan(heap_relation, snapshot, 0, NULL); + need_unregister_snapshot = true; + } else { + snapshot = scan->rs_snapshot; + need_unregister_snapshot = false; + } + + // FIXME: Only brin index uses partial index now. setup start_blockno + // and numblocks is too late after beginscan is called now, because + // the current micro partition is opened. The workaround is ugly to + // check and close the current micro partition and open another one. + if (start_blockno != 0 || numblocks != InvalidBlockNumber) + elog(ERROR, "PAX doesn't support partial index scan now"); + + while (table_scan_getnextslot(scan, ForwardScanDirection, slot)) { + CHECK_FOR_INTERRUPTS(); + + if (progress) { + BlockNumber blkno = pax::GetBlockNumber(slot->tts_tid); + if (previous_blkno == InvalidBlockNumber) + previous_blkno = blkno; + else if (previous_blkno != blkno) { + pgstat_progress_update_param(PROGRESS_SCAN_BLOCKS_DONE, + blkno - start_blockno); + previous_blkno = blkno; + } + } + reltuples += 1; + + MemoryContextReset(econtext->ecxt_per_tuple_memory); + + /* + * In a partial index, discard tuples that don't satisfy the + * predicate. + */ + if (predicate && !ExecQual(predicate, econtext)) continue; + + /* + * For the current heap tuple, extract all the attributes we use in + * this index, and note which are null. This also performs evaluation + * of any expressions needed. 
+ */ + FormIndexDatum(index_info, slot, estate, values, isnull); + + /* + * You'd think we should go ahead and build the index tuple here, but + * some index AMs want to do further processing on the data first. So + * pass the values[] and isnull[] arrays, instead. + */ + callback(index_relation, &slot->tts_tid, values, isnull, true, + callback_state); + } + + /* Report scan progress one last time. */ + if (progress && previous_blkno != InvalidBlockNumber) + pgstat_progress_update_param(PROGRESS_SCAN_BLOCKS_DONE, + previous_blkno + 1 - start_blockno); + + table_endscan(scan); + if (need_unregister_snapshot) UnregisterSnapshot(snapshot); + + ExecDropSingleTupleTableSlot(slot); + FreeExecutorState(estate); + + /* These may have been pointing to the now-gone estate */ + index_info->ii_ExpressionsState = NIL; + index_info->ii_PredicateState = NULL; + + return reltuples; +} + +bool PaxAccessMethod::IndexUniqueCheck(Relation rel, ItemPointer tid, + Snapshot snapshot, bool *all_dead) { + return paxc::IndexUniqueCheck(rel, tid, snapshot, all_dead); } void PaxAccessMethod::IndexValidateScan(Relation /*heap_relation*/, @@ -664,83 +848,107 @@ void PaxAccessMethod::IndexValidateScan(Relation /*heap_relation*/, NOT_IMPLEMENTED_YET; } -#define PAX_COPY_OPT(pax_opts_, pax_opt_name_) \ - do { \ - PaxOptions *pax_opts = reinterpret_cast(pax_opts_); \ - int pax_name_offset_ = *reinterpret_cast(pax_opts->pax_opt_name_); \ - if (pax_name_offset_) \ - strlcpy(pax_opts->pax_opt_name_, \ - reinterpret_cast(pax_opts) + pax_name_offset_, \ - sizeof(pax_opts->pax_opt_name_)); \ - } while (0) -bytea *PaxAccessMethod::Amoptions(Datum reloptions, char /*relkind*/, - bool validate) { - void *rdopts; - - rdopts = build_reloptions(reloptions, validate, self_relopt_kind, - sizeof(PaxOptions), kSelfReloptTab, - lengthof(kSelfReloptTab)); - // adjust string values - PAX_COPY_OPT(rdopts, storage_format); - PAX_COPY_OPT(rdopts, compress_type); - - return reinterpret_cast(rdopts); -} -#undef 
PAX_COPY_OPT - +// Swap data between two pax tables, but not swap oids +// 1. swap partition-spec in pg_pax_tables +// 2. swap relation content for aux table and toast void PaxAccessMethod::SwapRelationFiles(Oid relid1, Oid relid2, TransactionId frozen_xid, MultiXactId cutoff_multi) { - HeapTuple tuple1; - HeapTuple tuple2; + HeapTuple old_tuple1; + HeapTuple old_tuple2; Relation pax_rel; + TupleDesc desc; + ScanKeyData key[1]; + SysScanDesc scan; - Oid b_relid1; - Oid b_relid2; + Oid aux_relid1; + Oid aux_relid2; - pax_rel = table_open(PaxTablesRelationId, RowExclusiveLock); + pax_rel = table_open(PAX_TABLES_RELATION_ID, RowExclusiveLock); + desc = RelationGetDescr(pax_rel); - tuple1 = SearchSysCacheCopy1(PAXTABLESID, relid1); - if (!HeapTupleIsValid(tuple1)) - ereport(ERROR, (errcode(ERRCODE_UNDEFINED_SCHEMA), - errmsg("cache lookup failed with relid=%u for aux relation " - "in pg_pax_tables.", - relid1))); + // save ctid, auxrelid and partition-spec for the first pax relation + ScanKeyInit(&key[0], ANUM_PG_PAX_TABLES_RELID, BTEqualStrategyNumber, F_OIDEQ, + ObjectIdGetDatum(relid1)); - tuple2 = SearchSysCacheCopy1(PAXTABLESID, relid2); - if (!HeapTupleIsValid(tuple2)) - ereport(ERROR, (errcode(ERRCODE_UNDEFINED_SCHEMA), - errmsg("cache lookup failed with relid=%u for aux relation " - "in pg_pax_tables.", - relid2))); + scan = systable_beginscan(pax_rel, PAX_TABLES_RELID_INDEX_ID, true, nullptr, + 1, key); + old_tuple1 = systable_getnext(scan); + if (!HeapTupleIsValid(old_tuple1)) + ereport(ERROR, (errmsg("relid=%u is not a pax relation", relid1))); - // swap the entries - { - Form_pg_pax_tables form1; - Form_pg_pax_tables form2; + old_tuple1 = heap_copytuple(old_tuple1); + systable_endscan(scan); - int16 temp_compresslevel; - NameData temp_compresstype; + // save ctid, auxrelid and partition-spec for the second pax relation + ScanKeyInit(&key[0], ANUM_PG_PAX_TABLES_RELID, BTEqualStrategyNumber, F_OIDEQ, + ObjectIdGetDatum(relid2)); + scan = 
systable_beginscan(pax_rel, PAX_TABLES_RELID_INDEX_ID, true, nullptr, + 1, key); + old_tuple2 = systable_getnext(scan); + if (!HeapTupleIsValid(old_tuple2)) + ereport(ERROR, (errmsg("relid=%u is not a pax relation", relid2))); - form1 = (Form_pg_pax_tables)GETSTRUCT(tuple1); - form2 = (Form_pg_pax_tables)GETSTRUCT(tuple2); + old_tuple2 = heap_copytuple(old_tuple2); + systable_endscan(scan); - Assert(((Form_pg_pax_tables)GETSTRUCT(tuple1))->relid == relid1); - Assert(((Form_pg_pax_tables)GETSTRUCT(tuple2))->relid == relid2); + // swap the entries + { + HeapTuple tuple1; + HeapTuple tuple2; + Datum values[NATTS_PG_PAX_TABLES]; + bool nulls[NATTS_PG_PAX_TABLES]; + Datum datum; + bool isnull; + + datum = + heap_getattr(old_tuple1, ANUM_PG_PAX_TABLES_AUXRELID, desc, &isnull); + Assert(!isnull); + aux_relid1 = DatumGetObjectId(datum); + + values[ANUM_PG_PAX_TABLES_RELID - 1] = ObjectIdGetDatum(relid1); + values[ANUM_PG_PAX_TABLES_AUXRELID - 1] = datum; + nulls[ANUM_PG_PAX_TABLES_RELID - 1] = false; + nulls[ANUM_PG_PAX_TABLES_AUXRELID - 1] = false; + + datum = heap_getattr(old_tuple2, ANUM_PG_PAX_TABLES_PARTITIONSPEC, desc, + &isnull); + if (!isnull) { + auto vl = reinterpret_cast(DatumGetPointer(datum)); + vl = pg_detoast_datum_packed(vl); + values[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = PointerGetDatum(vl); + } + nulls[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = isnull; - b_relid1 = form1->blocksrelid; - b_relid2 = form2->blocksrelid; + tuple1 = heap_form_tuple(desc, values, nulls); + tuple1->t_data->t_ctid = old_tuple1->t_data->t_ctid; + tuple1->t_self = old_tuple1->t_self; + tuple1->t_tableOid = old_tuple1->t_tableOid; - memcpy(&temp_compresstype, &form1->compresstype, sizeof(NameData)); - memcpy(&form1->compresstype, &form2->compresstype, sizeof(NameData)); - memcpy(&form2->compresstype, &temp_compresstype, sizeof(NameData)); + datum = + heap_getattr(old_tuple2, ANUM_PG_PAX_TABLES_AUXRELID, desc, &isnull); + Assert(!isnull); + aux_relid2 = DatumGetObjectId(datum); + + 
values[ANUM_PG_PAX_TABLES_RELID - 1] = ObjectIdGetDatum(relid2); + values[ANUM_PG_PAX_TABLES_AUXRELID - 1] = datum; + nulls[ANUM_PG_PAX_TABLES_RELID - 1] = false; + nulls[ANUM_PG_PAX_TABLES_AUXRELID - 1] = false; + + datum = heap_getattr(old_tuple1, ANUM_PG_PAX_TABLES_PARTITIONSPEC, desc, + &isnull); + if (!isnull) { + auto vl = reinterpret_cast(DatumGetPointer(datum)); + vl = pg_detoast_datum_packed(vl); + values[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = PointerGetDatum(vl); + } + nulls[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = isnull; - temp_compresslevel = form1->compresslevel; - form1->compresslevel = form2->compresslevel; - form2->compresslevel = temp_compresslevel; - } + tuple2 = heap_form_tuple(desc, values, nulls); + tuple2->t_data->t_ctid = old_tuple2->t_data->t_ctid; + tuple2->t_self = old_tuple2->t_self; + tuple2->t_tableOid = old_tuple2->t_tableOid; - { CatalogIndexState indstate; indstate = CatalogOpenIndexes(pax_rel); @@ -753,23 +961,55 @@ void PaxAccessMethod::SwapRelationFiles(Oid relid1, Oid relid2, /* swap relation files for aux table */ { - Relation b_rel1; - Relation b_rel2; - - b_rel1 = relation_open(b_relid1, AccessExclusiveLock); - b_rel2 = relation_open(b_relid2, AccessExclusiveLock); - - swap_relation_files(b_relid1, b_relid2, false, /* target_is_pg_class */ - true, /* swap_toast_by_content */ - true, /*swap_stats */ - true, /* is_internal */ + Relation aux_rel1; + Relation aux_rel2; + ReindexParams reindex_params = {0}; + Relation toast_rel1 = nullptr; + Relation toast_rel2 = nullptr; + + aux_rel1 = relation_open(aux_relid1, AccessExclusiveLock); + aux_rel2 = relation_open(aux_relid2, AccessExclusiveLock); + + if (OidIsValid(aux_rel1->rd_rel->reltoastrelid)) + toast_rel1 = + relation_open(aux_rel1->rd_rel->reltoastrelid, AccessExclusiveLock); + if (OidIsValid(aux_rel2->rd_rel->reltoastrelid)) + toast_rel2 = + relation_open(aux_rel2->rd_rel->reltoastrelid, AccessExclusiveLock); + + swap_relation_files(aux_relid1, aux_relid2, false, /* 
target_is_pg_class */ + true, /* swap_toast_by_content */ + true, /*swap_stats */ + true, /* is_internal */ frozen_xid, cutoff_multi, NULL); - relation_close(b_rel1, NoLock); - relation_close(b_rel2, NoLock); + if (toast_rel1) relation_close(toast_rel1, NoLock); + if (toast_rel2) relation_close(toast_rel2, NoLock); + relation_close(aux_rel1, NoLock); + relation_close(aux_rel2, NoLock); + + reindex_relation(aux_relid1, 0, &reindex_params); + reindex_relation(aux_relid2, 0, &reindex_params); } } +bytea *PaxAccessMethod::AmOptions(Datum reloptions, char relkind, + bool validate) { + return paxc_default_rel_options(reloptions, relkind, validate); +} + +void PaxAccessMethod::ValidateColumnEncodingClauses(List *encoding_opts) { + paxc_validate_column_encoding_clauses(encoding_opts); +} + +List *PaxAccessMethod::TransformColumnEncodingClauses(Relation /*rel*/, + List *encoding_opts, + bool validate, + bool from_type) { + return paxc_transform_column_encoding_clauses(encoding_opts, validate, + from_type); +} + } // namespace paxc // END of C implementation @@ -789,10 +1029,11 @@ static const TableAmRoutine kPaxColumnMethods = { .parallelscan_reinitialize = paxc::PaxAccessMethod::ParallelscanReinitialize, - .index_fetch_begin = paxc::PaxAccessMethod::IndexFetchBegin, - .index_fetch_reset = paxc::PaxAccessMethod::IndexFetchReset, - .index_fetch_end = paxc::PaxAccessMethod::IndexFetchEnd, - .index_fetch_tuple = paxc::PaxAccessMethod::IndexFetchTuple, + .index_fetch_begin = pax::CCPaxAccessMethod::IndexFetchBegin, + .index_fetch_reset = pax::CCPaxAccessMethod::IndexFetchReset, + .index_fetch_end = pax::CCPaxAccessMethod::IndexFetchEnd, + .index_fetch_tuple = pax::CCPaxAccessMethod::IndexFetchTuple, + .index_unique_check = paxc::PaxAccessMethod::IndexUniqueCheck, .tuple_fetch_row_version = paxc::PaxAccessMethod::TupleFetchRowVersion, .tuple_tid_valid = paxc::PaxAccessMethod::TupleTidValid, @@ -831,8 +1072,12 @@ static const TableAmRoutine kPaxColumnMethods = { 
.scan_sample_next_block = pax::CCPaxAccessMethod::ScanSampleNextBlock, .scan_sample_next_tuple = pax::CCPaxAccessMethod::ScanSampleNextTuple, - .amoptions = paxc::PaxAccessMethod::Amoptions, + .amoptions = paxc::PaxAccessMethod::AmOptions, .swap_relation_files = paxc::PaxAccessMethod::SwapRelationFiles, + .validate_column_encoding_clauses = + paxc::PaxAccessMethod::ValidateColumnEncodingClauses, + .transform_column_encoding_clauses = + paxc::PaxAccessMethod::TransformColumnEncodingClauses, }; PG_MODULE_MAGIC; @@ -841,107 +1086,168 @@ Datum pax_tableam_handler(PG_FUNCTION_ARGS) { // NOLINT PG_RETURN_POINTER(&kPaxColumnMethods); } -static void PaxValidateStorageFormat(const char *value) { - size_t i; - static const char *storage_formats[] = { - "orc", - "ppt", - }; - - for (i = 0; i < lengthof(storage_formats); i++) { - if (strcmp(value, storage_formats[i]) == 0) return; +static object_access_hook_type prev_object_access_hook = NULL; + +static void PaxObjectAccessHook(ObjectAccessType access, Oid class_id, + Oid object_id, int sub_id, void *arg) { + Relation rel; + PartitionKey pkey; + List *part; + List *pby; + paxc::PaxOptions *options; + + if (prev_object_access_hook) + prev_object_access_hook(access, class_id, object_id, sub_id, arg); + + if (access != OAT_POST_CREATE || class_id != RelationRelationId) return; + + CommandCounterIncrement(); + rel = relation_open(object_id, RowExclusiveLock); + auto ok = ((rel->rd_rel->relkind == RELKIND_RELATION || + rel->rd_rel->relkind == RELKIND_MATVIEW) && + rel->rd_options && RelationIsPAX(rel)); + if (!ok) goto out; + + options = reinterpret_cast(rel->rd_options); + if (!options->partition_by()) { + if (options->partition_ranges()) { + elog(ERROR, "set '%s', but partition_by not specified", + options->partition_ranges()); + } + goto out; } - ereport(ERROR, (errmsg("unsupported storage format: '%s'", value))); -} -static void PaxValidateCompresstype(const char *value) { - size_t i; - static const char *compress_types[] = { - 
"none", - "zlib", - }; + pby = paxc_raw_parse(options->partition_by()); + pkey = paxc::PaxRelationBuildPartitionKey(rel, pby); + if (pkey->partnatts > 1) elog(ERROR, "pax only support 1 partition key now"); - for (i = 0; i < lengthof(compress_types); i++) { - if (strcmp(value, compress_types[i]) == 0) return; - } - ereport(ERROR, (errmsg("unsupported compress type: '%s'", value))); -} + part = lappend(NIL, pby); + if (options->partition_ranges()) { + List *ranges; -static shmem_startup_hook_type prev_shmem_startup_hook = NULL; -static ExecutorStart_hook_type prev_executor_start = NULL; -static ExecutorEnd_hook_type prev_executor_end = NULL; -static uint32 executor_run_ref_count = 0; + ranges = paxc_parse_partition_ranges(options->partition_ranges()); + ranges = paxc::PaxValidatePartitionRanges(rel, pkey, ranges); + part = lappend(part, ranges); + } + // Currently, partition_ranges must be set to partition pax tables. + // We hope this option be removed and automatically partition data set. 
+ else + elog(ERROR, "partition_ranges must be set for partition_by='%s'", + options->partition_by()); -void PaxShmemInit() { - if (prev_shmem_startup_hook) prev_shmem_startup_hook(); + ::paxc::PaxInitializePartitionSpec(rel, reinterpret_cast(part)); - paxc::paxc_shmem_startup(); +out: + relation_close(rel, NoLock); } -static void PaxExecutorStart(QueryDesc *query_desc, int eflags) { - if (prev_executor_start) - prev_executor_start(query_desc, eflags); - else - standard_ExecutorStart(query_desc, eflags); - - executor_run_ref_count++; +static void DefineGUCs() { + DefineCustomBoolVariable("pax_enable_debug", "enable pax debug", NULL, + &pax::pax_enable_debug, true, PGC_USERSET, 0, NULL, + NULL, NULL); + + DefineCustomBoolVariable("pax_enable_filter", "enable pax filter", NULL, + &pax::pax_enable_filter, true, PGC_USERSET, 0, NULL, + NULL, NULL); + + DefineCustomIntVariable( + "pax_max_tuples_per_group", + "the default value for the limit on the number of tuples in a group", + NULL, &pax::pax_max_tuples_per_group, VEC_BATCH_LENGTH, 0, + VEC_BATCH_LENGTH * 100, PGC_USERSET, 0, NULL, NULL, NULL); + +#ifdef ENABLE_PLASMA + DefineCustomBoolVariable( + "pax_enable_plasma", "Enable plasma cache the set of columns", NULL, + &pax::pax_enable_plasma_in_mem, true, PGC_USERSET, 0, NULL, NULL, NULL); +#endif + + DefineCustomIntVariable( + "pax_scan_reuse_buffer_size", "set the reuse buffer size", NULL, + &pax::pax_scan_reuse_buffer_size, PAX_SCAN_REUSE_BUFFER_DEFAULT_SIZE, + PAX_SCAN_REUSE_BUFFER_MIN_SIZE, PAX_SCAN_REUSE_BUFFER_MAX_SIZE, + PGC_USERSET, 0, NULL, NULL, NULL); } -static void PaxExecutorEnd(QueryDesc *query_desc) { - if (prev_executor_end) - prev_executor_end(query_desc); - else - standard_ExecutorEnd(query_desc); +struct PaxObjectProperty { + const char *name; + Oid class_oid; + Oid index_oid; + AttrNumber attnum_oid; +}; - executor_run_ref_count--; - Assert(executor_run_ref_count >= 0); - if (executor_run_ref_count == 0) { - paxc::release_command_resource(); - } 
-} +static const struct PaxObjectProperty kPaxObjectProperties[] = { + {"fast-sequence", PAX_FASTSEQUENCE_OID, PAX_FASTSEQUENCE_INDEX_OID, + ANUM_PG_PAX_FAST_SEQUENCE_OBJID}, + {"pg_pax_tables", PAX_TABLES_RELATION_ID, PAX_TABLES_RELID_INDEX_ID, + ANUM_PG_PAX_TABLES_RELID}, + // add pg_pax_tables here +}; -static void PaxXactCallback(XactEvent event, void * /*arg*/) { - if (event == XACT_EVENT_COMMIT || event == XACT_EVENT_ABORT || - event == XACT_EVENT_PARALLEL_ABORT || - event == XACT_EVENT_PARALLEL_COMMIT) { - if (executor_run_ref_count > 0) { - executor_run_ref_count = 0; - paxc::release_command_resource(); - } +static const struct PaxObjectProperty *FindPaxObjectProperty(Oid class_id) { + for (const auto &property : kPaxObjectProperties) { + const auto p = &property; + if (p->class_oid == class_id) return p; } + return NULL; } -void _PG_init(void) { // NOLINT - if (!process_shared_preload_libraries_in_progress) { - ereport(ERROR, (errmsg("pax must be loaded via shared_preload_libraries"))); - return; - } +static void PaxDeleteObject(struct CustomObjectClass * /*self*/, + const ObjectAddress *object, int /*flags*/) { + Relation rel; + HeapTuple tup; + SysScanDesc scan; + ScanKeyData skey[1]; + + const auto object_property = FindPaxObjectProperty(object->classId); + Assert(object_property); + Assert(object_property->class_oid == object->classId); + + rel = table_open(object->classId, RowExclusiveLock); + ScanKeyInit(&skey[0], object_property->attnum_oid, BTEqualStrategyNumber, + F_OIDEQ, ObjectIdGetDatum(object->objectId)); + + scan = + systable_beginscan(rel, object_property->index_oid, true, NULL, 1, skey); - paxc::paxc_shmem_request(); + /* we expect exactly one match */ + tup = systable_getnext(scan); + if (!HeapTupleIsValid(tup)) + elog(ERROR, "could not find tuple for %s %u", object_property->name, + object->objectId); - prev_shmem_startup_hook = shmem_startup_hook; - shmem_startup_hook = PaxShmemInit; + CatalogTupleDelete(rel, &tup->t_self); - 
prev_executor_start = ExecutorStart_hook; - ExecutorStart_hook = PaxExecutorStart; + systable_endscan(scan); - prev_executor_end = ExecutorEnd_hook; - ExecutorEnd_hook = PaxExecutorEnd; + table_close(rel, RowExclusiveLock); +} + +static struct CustomObjectClass pax_fastsequence_coc = { + .class_id = PAX_FASTSEQUENCE_OID, + .do_delete = PaxDeleteObject, +}; + +static struct CustomObjectClass pax_tables_coc = { + .class_id = PAX_TABLES_RELATION_ID, + .do_delete = PaxDeleteObject, +}; + +void _PG_init(void) { // NOLINT + prev_object_access_hook = object_access_hook; + object_access_hook = PaxObjectAccessHook; ext_dml_init_hook = pax::CCPaxAccessMethod::ExtDmlInit; ext_dml_finish_hook = pax::CCPaxAccessMethod::ExtDmlFini; file_unlink_hook = pax::CCPaxAccessMethod::RelationFileUnlink; - RegisterXactCallback(PaxXactCallback, NULL); - - self_relopt_kind = add_reloption_kind(); - add_string_reloption(self_relopt_kind, "storage_format", "pax storage format", - "orc", PaxValidateStorageFormat, AccessExclusiveLock); - add_string_reloption(self_relopt_kind, "compresstype", "pax compress type", - PAX_DEFAULT_COMPRESSTYPE, PaxValidateCompresstype, - AccessExclusiveLock); - add_int_reloption(self_relopt_kind, "compresslevel", "pax compress level", - PAX_DEFAULT_COMPRESSLEVEL, AO_MIN_COMPRESSLEVEL, - AO_MAX_COMPRESSLEVEL, AccessExclusiveLock); + register_custom_object_class(&pax_fastsequence_coc); + register_custom_object_class(&pax_tables_coc); + + DefineGUCs(); + + RegisterResourceReleaseCallback(paxc::FdHandleAbortCallback, NULL); + + paxc::paxc_reg_rel_options(); } } // extern "C" diff --git a/contrib/pax_storage/src/cpp/access/pax_access_handle.h b/contrib/pax_storage/src/cpp/access/pax_access_handle.h index 2bca0ba15a7..d88afbb2917 100644 --- a/contrib/pax_storage/src/cpp/access/pax_access_handle.h +++ b/contrib/pax_storage/src/cpp/access/pax_access_handle.h @@ -3,6 +3,7 @@ #include "comm/cbdb_api.h" namespace paxc { + class PaxAccessMethod final { private: PaxAccessMethod() 
= default; @@ -22,14 +23,6 @@ class PaxAccessMethod final { static void ParallelscanReinitialize(Relation rel, ParallelTableScanDesc pscan); - /* Index Scan Callbacks, unsupported yet */ - static struct IndexFetchTableData *IndexFetchBegin(Relation rel); - static void IndexFetchEnd(struct IndexFetchTableData *data); - static void IndexFetchReset(struct IndexFetchTableData *data); - static bool IndexFetchTuple(struct IndexFetchTableData *scan, ItemPointer tid, - Snapshot snapshot, TupleTableSlot *slot, - bool *call_again, bool *all_dead); - /* Callbacks for non-modifying operations on individual tuples */ static bool TupleFetchRowVersion(Relation relation, ItemPointer tid, Snapshot snapshot, TupleTableSlot *slot); @@ -66,15 +59,18 @@ class PaxAccessMethod final { bool allow_sync, bool anyvisible, bool progress, BlockNumber start_blockno, BlockNumber numblocks, IndexBuildCallback callback, void *callback_state, TableScanDesc scan); + static bool IndexUniqueCheck(Relation rel, ItemPointer tid, Snapshot snapshot, bool *all_dead); static void IndexValidateScan(Relation heap_relation, Relation index_relation, IndexInfo *index_info, Snapshot snapshot, ValidateIndexState *state); - - static bytea *Amoptions(Datum reloptions, char relkind, bool validate); - static void SwapRelationFiles(Oid relid1, Oid relid2, TransactionId frozen_xid, MultiXactId cutoff_multi); + + static bytea *AmOptions(Datum reloptions, char relkind, bool validate); + static void ValidateColumnEncodingClauses(List *encoding_opts); + static List *TransformColumnEncodingClauses(Relation rel, List *encoding_opts, + bool validate, bool from_type); }; } // namespace paxc @@ -96,9 +92,17 @@ class CCPaxAccessMethod final { TupleTableSlot *slot); static TableScanDesc ScanExtractColumns(Relation rel, Snapshot snapshot, + int nkeys, struct ScanKeyData *key, ParallelTableScanDesc parallel_scan, - List *targetlist, List *qual, - uint32 flags); + struct PlanState *ps, uint32 flags); + + /* Index Scan Callbacks */ + 
static struct IndexFetchTableData *IndexFetchBegin(Relation rel); + static void IndexFetchEnd(struct IndexFetchTableData *scan); + static void IndexFetchReset(struct IndexFetchTableData *scan); + static bool IndexFetchTuple(struct IndexFetchTableData *scan, ItemPointer tid, + Snapshot snapshot, TupleTableSlot *slot, + bool *call_again, bool *all_dead); /* Manipulations of physical tuples. */ static void TupleInsert(Relation relation, TupleTableSlot *slot, @@ -162,11 +166,3 @@ class CCPaxAccessMethod final { extern ext_dml_func_hook_type ext_dml_init_hook; extern ext_dml_func_hook_type ext_dml_finish_hook; - -// plain structure used by reloptions, can be accessed from C++ code. -struct PaxOptions { - int32 vl_len; /* varlena header (do not touch directly!) */ - char storage_format[16]; - char compress_type[16]; - int compress_level; -}; diff --git a/contrib/pax_storage/src/cpp/access/pax_deleter.cc b/contrib/pax_storage/src/cpp/access/pax_deleter.cc index 594bc221eb0..3af63a7e6bb 100644 --- a/contrib/pax_storage/src/cpp/access/pax_deleter.cc +++ b/contrib/pax_storage/src/cpp/access/pax_deleter.cc @@ -5,18 +5,15 @@ #include #include "access/pax_dml_state.h" +#include "catalog/pax_aux_table.h" #include "comm/singleton.h" #include "storage/pax_itemptr.h" -#include "storage/paxc_block_map_manager.h" namespace pax { -CPaxDeleter::CPaxDeleter(const Relation rel, const Snapshot snapshot) +CPaxDeleter::CPaxDeleter(Relation rel, Snapshot snapshot) : rel_(rel), snapshot_(snapshot) {} -CPaxDeleter::~CPaxDeleter() = default; - -TM_Result CPaxDeleter::DeleteTuple(const Relation relation, - const ItemPointer tid, const CommandId cid, - const Snapshot snapshot, +TM_Result CPaxDeleter::DeleteTuple(Relation relation, ItemPointer tid, + CommandId cid, Snapshot snapshot, TM_FailureData *tmfd) { CPaxDeleter *deleter = CPaxDmlStateLocal::Instance()->GetDeleter(relation, snapshot); @@ -29,63 +26,64 @@ TM_Result CPaxDeleter::DeleteTuple(const Relation relation, } return result; } +// used 
for delete tuples +TM_Result CPaxDeleter::MarkDelete(ItemPointer tid) { + uint32 tuple_offset = pax::GetTupleOffset(*tid); -TM_Result CPaxDeleter::MarkDelete(const ItemPointer tid) { - PaxItemPointer pax_tid(reinterpret_cast(tid)); - uint8 table_no = pax_tid.GetTableNo(); - uint32 block_number = pax_tid.GetBlockNumber(); - uint32 tuple_number = pax_tid.GetTupleNumber(); - - std::string block_id = - cbdb::GetBlockId(rel_->rd_id, table_no, block_number).ToStr(); + std::string block_id = MapToBlockNumber(rel_, *tid); if (block_bitmap_map_.find(block_id) == block_bitmap_map_.end()) { - // TODO(gongxun): bitmap should support dynamic raise size block_bitmap_map_[block_id] = - std::unique_ptr(new DynamicBitmap()); // NOLINT - } - DynamicBitmap *bitmap = block_bitmap_map_[block_id].get(); - if (bitmap->NumBits() <= tuple_number) { - bitmap->Resize(bitmap->NumBits() * 2); + pax_unique_ptr(PAX_NEW()); // NOLINT + cbdb::DeleteMicroPartitionEntry(RelationGetRelid(rel_), snapshot_, + block_id); } - - if (bitmap->Test(tuple_number)) { + auto bitmap = block_bitmap_map_[block_id].get(); + if (bitmap->Test(tuple_offset)) { return TM_SelfModified; } - - bitmap->Set(tuple_number); + bitmap->Set(tuple_offset); return TM_Ok; } -void CPaxDeleter::ExecDelete() { - if (block_bitmap_map_.empty()) { - return; +// used for merge remaining partition files, no tuple needs to delete +void CPaxDeleter::MarkDelete(BlockNumber pax_block_id) { + std::string block_id = std::to_string(pax_block_id); + + if (block_bitmap_map_.find(block_id) == block_bitmap_map_.end()) { + block_bitmap_map_[block_id] = pax_unique_ptr(PAX_NEW()); + cbdb::DeleteMicroPartitionEntry(RelationGetRelid(rel_), snapshot_, + block_id); } +} + +void CPaxDeleter::ExecDelete() { + if (block_bitmap_map_.empty()) return; - TableDeleter table_deleter(rel_, buildDeleteIterator(), + TableDeleter table_deleter(rel_, BuildDeleteIterator(), std::move(block_bitmap_map_), snapshot_); table_deleter.Delete(); } -std::unique_ptr> 
-CPaxDeleter::buildDeleteIterator() { +pax_unique_ptr> +CPaxDeleter::BuildDeleteIterator() { std::vector micro_partitions; + auto rel_path = cbdb::BuildPaxDirectoryPath(rel_->rd_node, rel_->rd_backend); for (auto &it : block_bitmap_map_) { std::string block_id = it.first; - DynamicBitmap *bitmap_ptr = it.second.get(); - BitmapIterator bitmap_it(bitmap_ptr); - int32 tuple_number = bitmap_it.Next(true); - if (tuple_number != -1) { + { pax::MicroPartitionMetadata meta_info; - meta_info.SetFileName(cbdb::BuildPaxFilePath(rel_, block_id)); + meta_info.SetFileName(cbdb::BuildPaxFilePath(rel_path, block_id)); meta_info.SetMicroPartitionId(std::move(block_id)); micro_partitions.push_back(std::move(meta_info)); } } - IteratorBase *iter = new VectorIterator(std::move(micro_partitions)); + IteratorBase *iter = + PAX_NEW>( + std::move(micro_partitions)); - return std::unique_ptr>(iter); + return pax_unique_ptr>(iter); } } // namespace pax diff --git a/contrib/pax_storage/src/cpp/access/pax_deleter.h b/contrib/pax_storage/src/cpp/access/pax_deleter.h index 7d94ffe6efd..0312e63a742 100644 --- a/contrib/pax_storage/src/cpp/access/pax_deleter.h +++ b/contrib/pax_storage/src/cpp/access/pax_deleter.h @@ -7,27 +7,26 @@ #include #include "comm/bitmap.h" +#include "comm/pax_memory.h" #include "storage/pax.h" namespace pax { class CPaxDeleter { public: - explicit CPaxDeleter(const Relation rel, const Snapshot snapshot); - - static TM_Result DeleteTuple(const Relation relation, const ItemPointer tid, - const CommandId cid, const Snapshot snapshot, + explicit CPaxDeleter(Relation rel, Snapshot snapshot); + ~CPaxDeleter() = default; + static TM_Result DeleteTuple(Relation relation, ItemPointer tid, + CommandId cid, Snapshot snapshot, TM_FailureData *tmfd); - TM_Result MarkDelete(const ItemPointer tid); - - ~CPaxDeleter(); - + TM_Result MarkDelete(ItemPointer tid); + void MarkDelete(BlockNumber pax_block_id); void ExecDelete(); private: - std::unique_ptr> buildDeleteIterator(); - std::map> 
block_bitmap_map_; - const Relation rel_; - const Snapshot snapshot_; + std::unique_ptr> BuildDeleteIterator(); + std::map> block_bitmap_map_; + Relation rel_; + Snapshot snapshot_; }; // class CPaxDeleter } // namespace pax diff --git a/contrib/pax_storage/src/cpp/access/pax_dml_state.cc b/contrib/pax_storage/src/cpp/access/pax_dml_state.cc index 335eb659197..91cd996339f 100644 --- a/contrib/pax_storage/src/cpp/access/pax_dml_state.cc +++ b/contrib/pax_storage/src/cpp/access/pax_dml_state.cc @@ -8,10 +8,6 @@ void CPaxDmlStateLocal::DmlStateResetCallback(void * /*arg*/) { } void CPaxDmlStateLocal::InitDmlState(Relation rel, CmdType operation) { - if (operation == CMD_UPDATE || operation == CMD_DELETE) { - cbdb::InitCommandResource(); - } - if (!dml_descriptor_tab_) { HASHCTL hash_ctl; Assert(!cbdb::pax_memory_context); @@ -44,7 +40,7 @@ void CPaxDmlStateLocal::FinishDmlState(Relation rel, CmdType /*operation*/) { // TODO(gongxun): deleter finish state->deleter->ExecDelete(); - delete state->deleter; + PAX_DELETE(state->deleter); state->deleter = nullptr; // FIXME: it's update operation, maybe we should do something here } @@ -55,7 +51,7 @@ void CPaxDmlStateLocal::FinishDmlState(Relation rel, CmdType /*operation*/) { old_ctx = MemoryContextSwitchTo(cbdb::pax_memory_context); state->inserter->FinishInsert(); - delete state->inserter; + PAX_DELETE(state->inserter); state->inserter = nullptr; MemoryContextSwitchTo(old_ctx); } @@ -66,7 +62,7 @@ CPaxInserter *CPaxDmlStateLocal::GetInserter(Relation rel) { state = FindDmlState(cbdb::RelationGetRelationId(rel)); // TODO(gongxun): switch memory context?? if (state->inserter == nullptr) { - state->inserter = new CPaxInserter(rel); + state->inserter = PAX_NEW(rel); } return state->inserter; } @@ -76,7 +72,7 @@ CPaxDeleter *CPaxDmlStateLocal::GetDeleter(Relation rel, Snapshot snapshot) { state = FindDmlState(cbdb::RelationGetRelationId(rel)); // TODO(gongxun): switch memory context?? 
if (state->deleter == nullptr) { - state->deleter = new CPaxDeleter(rel, snapshot); + state->deleter = PAX_NEW(rel, snapshot); } return state->deleter; } diff --git a/contrib/pax_storage/src/cpp/access/pax_inserter.cc b/contrib/pax_storage/src/cpp/access/pax_inserter.cc index 2584efdb3d9..68d1da880b6 100644 --- a/contrib/pax_storage/src/cpp/access/pax_inserter.cc +++ b/contrib/pax_storage/src/cpp/access/pax_inserter.cc @@ -4,18 +4,32 @@ #include #include "access/pax_dml_state.h" -#include "catalog/micro_partition_stats.h" +#include "access/pax_partition.h" +#include "access/paxc_rel_options.h" #include "catalog/pax_aux_table.h" #include "comm/cbdb_wrappers.h" +#include "storage/micro_partition_stats.h" #include "storage/strategy.h" namespace pax { -CPaxInserter::CPaxInserter(Relation rel) : rel_(rel), insert_count_(0) { - writer_ = new TableWriter(rel); - writer_->SetWriteSummaryCallback(&cbdb::AddMicroPartitionEntry) - ->SetFileSplitStrategy(new PaxDefaultSplitStrategy()) - ->SetStatsCollector(new MicroPartitionStats()) +CPaxInserter::CPaxInserter(Relation rel) + : rel_(rel), insert_count_(0), part_obj_(nullptr), writer_(nullptr) { + part_obj_ = PAX_NEW(); + auto ok = part_obj_->Initialize(rel_); + if (ok) { + writer_ = PAX_NEW(rel, part_obj_); + } else { + // fallback to TableWriter + writer_ = PAX_NEW(rel); + part_obj_->Release(); + PAX_DELETE(part_obj_); + part_obj_ = nullptr; + } + + writer_->SetWriteSummaryCallback(&cbdb::InsertOrUpdateMicroPartitionEntry) + ->SetFileSplitStrategy(PAX_NEW()) + ->SetStatsCollector(PAX_NEW()) ->Open(); } @@ -29,8 +43,7 @@ void CPaxInserter::InsertTuple(Relation relation, TupleTableSlot *slot, slot_getallattrs(slot); } - CTupleSlot cslot(slot); - writer_->WriteTuple(&cslot); + writer_->WriteTuple(slot); } void CPaxInserter::MultiInsert(Relation relation, TupleTableSlot **slots, @@ -51,8 +64,14 @@ void CPaxInserter::FinishBulkInsert(Relation relation, int /*options*/) { void CPaxInserter::FinishInsert() { writer_->Close(); - 
delete writer_; + PAX_DELETE(writer_); writer_ = nullptr; + + if (part_obj_) { + part_obj_->Release(); + PAX_DELETE(part_obj_); + part_obj_ = nullptr; + } } void CPaxInserter::TupleInsert(Relation relation, TupleTableSlot *slot, diff --git a/contrib/pax_storage/src/cpp/access/pax_inserter.h b/contrib/pax_storage/src/cpp/access/pax_inserter.h index abd191981bf..92300769755 100644 --- a/contrib/pax_storage/src/cpp/access/pax_inserter.h +++ b/contrib/pax_storage/src/cpp/access/pax_inserter.h @@ -4,9 +4,9 @@ #include "storage/micro_partition_metadata.h" #include "storage/pax.h" - +#include "storage/pax_table_partition_writer.h" namespace pax { - +class PartitionObject; class CPaxInserter { public: explicit CPaxInserter(Relation rel); @@ -29,6 +29,7 @@ class CPaxInserter { Relation rel_; uint32 insert_count_; + PartitionObject *part_obj_; TableWriter *writer_; }; // class CPaxInserter diff --git a/contrib/pax_storage/src/cpp/access/pax_partition.cc b/contrib/pax_storage/src/cpp/access/pax_partition.cc new file mode 100644 index 00000000000..9533677a969 --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/pax_partition.cc @@ -0,0 +1,745 @@ +#include "access/pax_partition.h" + +#include "comm/cbdb_api.h" + +#include "access/pax_access_handle.h" +#include "catalog/pg_pax_tables.h" +#include "comm/cbdb_wrappers.h" + +namespace paxc { +// support optional `EVERY` syntax: +// FROM(start_value) TO(end_value) [ EVERY(interval) ] +struct PaxPartitionEveryIterator { + PartitionKey key; + Datum from_value; + Datum to_value; + + ExprState *plus_expr_state; + ParamListInfo plus_expr_params; + EState *estate; + + Datum current_start; + Datum current_end; + bool ended; + + ParseState *pstate; +}; + +static int PartitionCheckBound(PartitionKey key, PartitionBoundSpec *spec); + +static void PaxPartitionDestroyEveryIterator( + struct PaxPartitionEveryIterator *iter) { + if (iter->estate) FreeExecutorState(iter->estate); + pfree(iter); +} + +// See the implementation in 
PartEveryIterator +static struct PaxPartitionEveryIterator *PaxPartitionInitEveryIterator( + ParseState *pstate, PartitionKey key, Node *from, Node *to, Node *every) { + Assert(key->partnatts == 1); + auto part_col_typid = get_partition_col_typid(key, 0); + auto part_col_typmod = get_partition_col_typmod(key, 0); + auto part_col_collation = get_partition_col_collation(key, 0); + Datum from_value; + Datum to_value; + Const *c; + + auto iter = + (PaxPartitionEveryIterator *)palloc0(sizeof(PaxPartitionEveryIterator)); + Assert(from && to && every); + + c = castNode(Const, from); + if (c->constisnull) + elog(ERROR, "can't use NULL with range partition specification"); + from_value = c->constvalue; + + c = castNode(Const, to); + if (c->constisnull) + elog(ERROR, "can't use NULL with range partition specification"); + to_value = c->constvalue; + + auto param = makeNode(Param); + param->paramid = 1; + param->paramtype = part_col_typid; + param->paramtypmod = part_col_typmod; + param->paramcollid = part_col_collation; + param->location = -1; + + auto plus_expr = (Node *)make_op( + pstate, + list_make2(makeString((char *)"pg_catalog"), makeString((char *)"+")), + (Node *)param, (Node *)every, pstate->p_last_srf, -1); + + if (IsA(plus_expr, CollateExpr)) { + auto expr_collation = exprCollation(plus_expr); + if (OidIsValid(expr_collation) && expr_collation != part_col_collation) + elog(ERROR, + "collation of partition bound value for column %d doesn't match " + "partition key collation \"%s\"", + get_partition_col_attnum(key, 0), + get_collation_name(part_col_collation)); + } + plus_expr = coerce_to_target_type( + pstate, plus_expr, exprType(plus_expr), part_col_typid, part_col_typmod, + COERCION_ASSIGNMENT, COERCE_IMPLICIT_CAST, -1); + if (plus_expr == NULL) + ereport(ERROR, + (errcode(ERRCODE_DATATYPE_MISMATCH), + errmsg("specified value cannot be cast to type %s for column %d", + format_type_be(part_col_typid), + get_partition_col_attnum(key, 0)))); + + iter->key = key; 
+ iter->from_value = from_value; + iter->to_value = to_value; + + iter->plus_expr_params = makeParamList(1); + iter->plus_expr_params->params[0].value = (Datum)0; + iter->plus_expr_params->params[0].isnull = true; + iter->plus_expr_params->params[0].pflags = 0; + iter->plus_expr_params->params[0].ptype = part_col_typid; + iter->estate = CreateExecutorState(); + iter->estate->es_param_list_info = iter->plus_expr_params; + + iter->plus_expr_state = + ExecInitExprWithParams((Expr *)plus_expr, iter->plus_expr_params); + + iter->current_end = iter->from_value; + iter->current_start = (Datum)0; + iter->ended = false; + + iter->pstate = pstate; + + return iter; +} + +static List *PaxPartitionBuildDatums(PartitionKey key, Datum *datums) { + List *result = NIL; + for (int i = 0; i < key->partnatts; i++) { + Const *c; + PartitionRangeDatum *prd; + c = makeConst( + key->parttypid[i], key->parttypmod[i], key->parttypcoll[i], + key->parttyplen[i], + datumCopy(datums[i], key->parttypbyval[i], key->parttyplen[i]), false, + key->parttypbyval[i]); + + prd = makeNode(PartitionRangeDatum); + prd->kind = PARTITION_RANGE_DATUM_VALUE; + prd->value = (Node *)c; + result = lappend(result, prd); + } + return result; +} + +static PartitionBoundSpec *PaxPartitionNextPartBound( + struct PaxPartitionEveryIterator *iter) { + if (iter->ended) return nullptr; + + bool isnull; + + iter->plus_expr_params->params[0].isnull = false; + iter->plus_expr_params->params[0].value = iter->current_end; + + auto next_start = iter->current_end; + auto next_end = ExecEvalExprSwitchContext( + iter->plus_expr_state, GetPerTupleExprContext(iter->estate), &isnull); + if (isnull) + ereport(ERROR, (errcode(ERRCODE_INVALID_TABLE_DEFINITION), + errmsg("could not compute next partition boundary with " + "EVERY, plus-operator returned NULL"), + parser_errposition(iter->pstate, -1))); + + auto cmpval = DatumGetInt32(FunctionCall2Coll(&iter->key->partsupfunc[0], + iter->key->partcollation[0], + next_end, iter->to_value)); 
+ if (cmpval >= 0) { + iter->ended = true; + next_end = iter->to_value; + } + // sanity check in case next_start >= next_end + cmpval = DatumGetInt32(FunctionCall2Coll(&iter->key->partsupfunc[0], + iter->key->partcollation[0], + next_start, next_end)); + if (cmpval >= 0) elog(ERROR, "invalid range bound with EVERY"); + + iter->current_start = next_start; + iter->current_end = next_end; + + // build PartitionBoundSpec for [iter->current_start, iter->current_end) + PartitionBoundSpec *boundspec; + + boundspec = makeNode(PartitionBoundSpec); + boundspec->strategy = PARTITION_STRATEGY_RANGE; + boundspec->is_default = false; + boundspec->lowerdatums = + PaxPartitionBuildDatums(iter->key, &iter->current_start); + boundspec->upperdatums = + PaxPartitionBuildDatums(iter->key, &iter->current_end); + + return boundspec; +} + +static Node *GetConstValue(List *datums) { + auto prd = (PartitionRangeDatum *)linitial(datums); + Assert(IsA(prd, PartitionRangeDatum)); + Assert(prd->kind == PARTITION_RANGE_DATUM_VALUE); + + auto c = (Const *)prd->value; + Assert(c && IsA(c, Const) && !c->constisnull); + return (Node *)c; +} + +// generate a list of partition bound specs +static List *TransformPartitionExtension(ParseState *pstate, Relation relation, + PartitionKey key, + PartitionRangeExtension *range_ext) { + List *result = NIL; + PartitionBoundSpec *range; + + auto every = range_ext->every; + auto spec = transformPartitionBound(pstate, relation, key, &range_ext->spec); + if (!every) return list_make1(spec); + + if (PartitionCheckBound(key, spec) >= 0) + elog(ERROR, "invalid range bound: from %s to %s every(X)", + get_range_partbound_string(spec->lowerdatums), + get_range_partbound_string(spec->upperdatums)); + + // calculate partition by every expression + if (key->partnatts != 1 || key->partnatts != list_length(every)) + elog(ERROR, "pax partition EVERY only support one column"); + + auto ev = (Node *)linitial(every); + auto iter = PaxPartitionInitEveryIterator( + pstate, key, 
GetConstValue(spec->lowerdatums), + GetConstValue(spec->upperdatums), + (Node *)transformExpr(pstate, ev, EXPR_KIND_PARTITION_BOUND)); + + while ((range = PaxPartitionNextPartBound(iter))) { + result = lappend(result, range); + } + PaxPartitionDestroyEveryIterator(iter); + return result; +} + +static bool PaxLoadPartitionSpec(Oid relid, List **partparams_list, + List **partboundspec_list) { + Node *part; + List *list; + + ::paxc::GetPaxTablesEntryAttributes(relid, NULL, &part); + if (!part) return false; + + list = castNode(List, part); + Assert(list_length(list) == 2); + *partparams_list = castNode(List, list_nth(list, 0)); + *partboundspec_list = castNode(List, list_nth(list, 1)); + return true; +} + +static inline PartitionRangeDatumKind RangeDatumToKind(List *datums, int i) { + PartitionRangeDatum *rd = castNode(PartitionRangeDatum, list_nth(datums, i)); + return rd->kind; +} +static inline Datum RangeDatumToValue(List *datums, int i) { + PartitionRangeDatum *rd = castNode(PartitionRangeDatum, list_nth(datums, i)); + Const *c = castNode(Const, rd->value); + Assert(c && !c->constisnull); + return c->constvalue; +} +// Reference: partition_rbound_cmp() +int PartitionComparePartitionKeys(PartitionKey key, List *datums1, + List *datums2) { + Assert(key->partnatts == list_length(datums1)); + Assert(key->partnatts == list_length(datums2)); + FmgrInfo *partsupfunc = key->partsupfunc; + Oid *partcollation = key->partcollation; + int natts = key->partnatts; + int i; + int32 colnum = 0; + int32 cmpval = 0; + for (i = 0; i < natts; i++) { + colnum++; + auto kind1 = RangeDatumToKind(datums1, i); + auto kind2 = RangeDatumToKind(datums2, i); + + if (kind1 < kind2) return -colnum; + if (kind1 > kind2) return colnum; + if (kind1 != PARTITION_RANGE_DATUM_VALUE) { + /* + * The column bounds are both MINVALUE or both MAXVALUE. No later + * columns should be considered, but we still need to compare + * whether they are upper or lower bounds. 
+ */ + break; + } + cmpval = DatumGetInt32(FunctionCall2Coll(&partsupfunc[i], partcollation[i], + RangeDatumToValue(datums1, i), + RangeDatumToValue(datums2, i))); + if (cmpval != 0) break; + } + return cmpval == 0 ? 0 : (cmpval < 0 ? -colnum : colnum); +} + +static int PartitionCheckBound(PartitionKey key, PartitionBoundSpec *spec) { + return PartitionComparePartitionKeys(key, spec->lowerdatums, + spec->upperdatums); +} + +int PartitionBoundSpecCmp(const ListCell *a, const ListCell *b, void *arg) { + auto spec1 = lfirst_node(PartitionBoundSpec, a); + auto spec2 = lfirst_node(PartitionBoundSpec, b); + auto key = static_cast(arg); + return PartitionComparePartitionKeys(key, spec1->lowerdatums, + spec2->lowerdatums); +} + +bool PartitionCheckBounds(PartitionKey key, List *spec_list) { + ListCell *lc; + int i; + int nparts = list_length(spec_list); + bool ok = true; + + Assert(nparts > 0); + + // self bound check + foreach (lc, spec_list) { + auto spec = lfirst_node(PartitionBoundSpec, lc); + + if (spec->strategy != key->strategy) + elog(ERROR, "strategy not match with partition key"); + if (spec->is_default) elog(ERROR, "unexpected default partition"); + if (list_length(spec->lowerdatums) != key->partnatts) + elog(ERROR, + "number of lower bound values mismatches the number of partition " + "keys"); + if (list_length(spec->upperdatums) != key->partnatts) + elog(ERROR, + "number of upper bound values mismatches the number of partition " + "keys"); + + ok = PartitionCheckBound(key, spec) < 0; + if (!ok) goto out; + } + + // cross bound check, only checks whether prev.upper <= cur.lower + list_sort_arg(spec_list, PartitionBoundSpecCmp, key); + for (i = 1; i < nparts; i++) { + auto spec1 = castNode(PartitionBoundSpec, list_nth(spec_list, i - 1)); + auto spec2 = castNode(PartitionBoundSpec, list_nth(spec_list, i)); + // the upper value should be less than or equal to the lower value of the + // next part + ok = PartitionComparePartitionKeys(key, spec1->upperdatums, + 
spec2->lowerdatums) <= 0; + if (!ok) break; + } +out: + return ok; +} + +List *PaxValidatePartitionRanges(Relation relation, PartitionKey key, + List *raw_partbound_list) { + ParseState *pstate = make_parsestate(NULL); + List *spec_list = NIL; + int nparts; + bool ok; + + nparts = list_length(raw_partbound_list); + Assert(nparts > 0); + + for (int i = 0; i < nparts; i++) { + auto spec = + static_cast(list_nth(raw_partbound_list, i)); + Assert(IsA(spec, PartitionBoundSpec)); + auto part_list = TransformPartitionExtension(pstate, relation, key, spec); + spec_list = list_concat(spec_list, part_list); + pfree(part_list); + } + + // check whether bounds overlaps + ok = paxc::PartitionCheckBounds(key, spec_list); + if (!ok) elog(ERROR, "partition bounds have overlaps"); + + list_free_deep(raw_partbound_list); + free_parsestate(pstate); + + return spec_list; +} + +// Reference: RelationBuildPartitionKey +PartitionKey PaxRelationBuildPartitionKey(Relation relation, + List *partparams_list) { + int i; + PartitionKey key; + Oid *partopclass; + ListCell *partexprs_item; + int16 procnum; + + Assert(RelationIsPAX(relation)); + + key = (PartitionKey)palloc0(sizeof(PartitionKeyData)); + key->strategy = PARTITION_STRATEGY_RANGE; + key->partnatts = list_length(partparams_list); + key->partattrs = (AttrNumber *)palloc(key->partnatts * sizeof(AttrNumber)); + key->partopfamily = (Oid *)palloc(key->partnatts * sizeof(Oid)); + key->partopcintype = (Oid *)palloc(key->partnatts * sizeof(Oid)); + key->partsupfunc = (FmgrInfo *)palloc0(key->partnatts * sizeof(FmgrInfo)); + + key->partcollation = (Oid *)palloc(key->partnatts * sizeof(Oid)); + key->parttypid = (Oid *)palloc(key->partnatts * sizeof(Oid)); + key->parttypmod = (int32 *)palloc(key->partnatts * sizeof(int32)); + key->parttyplen = (int16 *)palloc(key->partnatts * sizeof(int16)); + key->parttypbyval = (bool *)palloc(key->partnatts * sizeof(bool)); + key->parttypalign = (char *)palloc(key->partnatts * sizeof(char)); + 
key->parttypcoll = (Oid *)palloc(key->partnatts * sizeof(Oid)); + + partopclass = (Oid *)palloc(key->partnatts * sizeof(Oid)); + ComputePartitionAttrs(NULL, relation, partparams_list, key->partattrs, NULL, + partopclass, key->partcollation, key->strategy); + + /* determine support function number to search for */ + procnum = (key->strategy == PARTITION_STRATEGY_HASH) ? HASHEXTENDED_PROC + : BTORDER_PROC; + + // We don't have expressions as our partition keys, but keep + // the code the same as the kernel. + partexprs_item = list_head(key->partexprs); + for (i = 0; i < key->partnatts; i++) { + AttrNumber attno = key->partattrs[i]; + HeapTuple opclasstup; + Form_pg_opclass opclassform; + Oid funcid; + + /* Collect opfamily information */ + opclasstup = SearchSysCache1(CLAOID, ObjectIdGetDatum(partopclass[i])); + if (!HeapTupleIsValid(opclasstup)) + elog(ERROR, "cache lookup failed for opclass %u", partopclass[i]); + + opclassform = (Form_pg_opclass)GETSTRUCT(opclasstup); + key->partopfamily[i] = opclassform->opcfamily; + key->partopcintype[i] = opclassform->opcintype; + + /* Get a support function for the specified opfamily and datatypes */ + funcid = get_opfamily_proc(opclassform->opcfamily, opclassform->opcintype, + opclassform->opcintype, procnum); + if (!OidIsValid(funcid)) + ereport( + ERROR, + (errcode(ERRCODE_INVALID_OBJECT_DEFINITION), + errmsg("operator class \"%s\" of access method %s is missing " + "support function %d for type %s", + NameStr(opclassform->opcname), + (key->strategy == PARTITION_STRATEGY_HASH) ? 
"hash" : "btree", + procnum, format_type_be(opclassform->opcintype)))); + + fmgr_info_cxt(funcid, &key->partsupfunc[i], CurrentMemoryContext); + + /* Collect type information */ + if (attno != 0) { + Form_pg_attribute att = TupleDescAttr(relation->rd_att, attno - 1); + + key->parttypid[i] = att->atttypid; + key->parttypmod[i] = att->atttypmod; + key->parttypcoll[i] = att->attcollation; + } else { + if (partexprs_item == NULL) + elog(ERROR, "wrong number of partition key expressions"); + + key->parttypid[i] = exprType(static_cast(lfirst(partexprs_item))); + key->parttypmod[i] = + exprTypmod(static_cast(lfirst(partexprs_item))); + key->parttypcoll[i] = + exprCollation(static_cast(lfirst(partexprs_item))); + + partexprs_item = lnext(key->partexprs, partexprs_item); + } + get_typlenbyvalalign(key->parttypid[i], &key->parttyplen[i], + &key->parttypbyval[i], &key->parttypalign[i]); + + ReleaseSysCache(opclasstup); + } + pfree(partopclass); + return key; +} + +static PartitionDesc PaxRelationBuildPartitionDesc(PartitionKey key, + List *partboundspec_list, + MemoryContext tmp_ctx, + MemoryContext target_ctx) { + PartitionDesc partdesc; + PartitionBoundInfo boundinfo; + PartitionBoundSpec **boundspecs = NULL; + int nparts; + MemoryContext saved_cxt; + int *mapping; + + saved_cxt = MemoryContextSwitchTo(tmp_ctx); + nparts = list_length(partboundspec_list); + boundspecs = + (PartitionBoundSpec **)palloc(nparts * sizeof(PartitionBoundSpec *)); + for (int i = 0; i < nparts; i++) + boundspecs[i] = + static_cast(list_nth(partboundspec_list, i)); + + /* + * Create PartitionBoundInfo and mapping, working in the caller's context. + * This could fail, but we haven't done any damage if so. 
+ */ + boundinfo = partition_bounds_create(boundspecs, nparts, key, &mapping); + pfree(boundspecs); + + MemoryContextSwitchTo(target_ctx); + partdesc = (PartitionDescData *)palloc0(sizeof(PartitionDescData)); + partdesc->nparts = nparts; + partdesc->detached_exist = false; + partdesc->boundinfo = partition_bounds_copy(boundinfo, key); + pfree(boundinfo); + + // PAX doesn't have child partition tables + partdesc->oids = NULL; + partdesc->is_leaf = NULL; + /* Return to caller's context, and blow away the temporary context. */ + MemoryContextSwitchTo(saved_cxt); + return partdesc; +} + +static void PaxFormPartitionKeyDatum(PartitionKey key, TupleTableSlot *slot, + Datum *values, bool *isnull) { + for (int i = 0; i < key->partnatts; i++) { + AttrNumber keycol = key->partattrs[i]; + + Assert(keycol > 0); + values[i] = slot_getattr(slot, keycol, &isnull[i]); + } +} + +bool PartitionObjectInternal::Initialize(Relation pax_rel) { + MemoryContext tmp_ctx; + MemoryContext saved_ctx; + List *partparams_list; + List *partboundspec_list; + PartitionKey key = NULL; + PartitionDesc desc = NULL; + bool ok; + + Assert(pax_rel); + pax_rel_ = pax_rel; + + tmp_ctx = AllocSetContextCreate(CurrentMemoryContext, "tmp pax partition ctx", + ALLOCSET_DEFAULT_SIZES); + mctx_ = AllocSetContextCreate(CurrentMemoryContext, "pax partition ctx", + ALLOCSET_DEFAULT_SIZES); + MemoryContextCopyAndSetIdentifier(mctx_, RelationGetRelationName(pax_rel)); + + saved_ctx = MemoryContextSwitchTo(tmp_ctx); + ok = PaxLoadPartitionSpec(RelationGetRelid(pax_rel), &partparams_list, + &partboundspec_list); + if (!ok) goto out; + + MemoryContextSwitchTo(mctx_); + + // The partition keys have no strict constraint for DDLs. + // The column names/types may be changed later by the user, but the PAX code + // is not aware of it. So, we ignore these inconsistent changes for partition + // writer. 
+ PG_TRY(); + { + key = PaxRelationBuildPartitionKey(pax_rel, partparams_list); + InitializeMergeInfo(key, partboundspec_list, tmp_ctx, mctx_); + + desc = + PaxRelationBuildPartitionDesc(key, partboundspec_list, tmp_ctx, mctx_); + partition_bound_spec_ = static_cast(copyObject(partboundspec_list)); + } + PG_CATCH(); + { + // fall back to not use the partition writer + ok = false; + FlushErrorState(); + } + PG_END_TRY(); + partition_key_ = key; + partition_desc_ = desc; +out: + MemoryContextSwitchTo(saved_ctx); + MemoryContextDelete(tmp_ctx); + return ok; +} + +void PartitionObjectInternal::InitializeMergeInfo(PartitionKey key, + List *partboundspec_list, + MemoryContext tmp_ctx, + MemoryContext target_ctx) { + // gather whether the adjacent bounds are continuous + // NOTE: the bounds are already sorted. + MemoryContext saved_ctx; + int *merge_index; + int nparts; + int merge_len; + + saved_ctx = MemoryContextSwitchTo(tmp_ctx); + nparts = list_length(partboundspec_list); + merge_index = (int *)palloc(2 * nparts * sizeof(int)); + merge_index[0] = 0; + merge_len = 1; + for (int i = 1; i < nparts; i++) { + PartitionBoundSpec *spec1 = + castNode(PartitionBoundSpec, list_nth(partboundspec_list, i - 1)); + PartitionBoundSpec *spec2 = + castNode(PartitionBoundSpec, list_nth(partboundspec_list, i)); + + auto cmpval = PartitionComparePartitionKeys(key, spec1->upperdatums, + spec2->lowerdatums); + Assert(cmpval <= 0); + if (cmpval != 0) { + merge_index[merge_len++] = i - 1; + merge_index[merge_len++] = i; + } + } + merge_index[merge_len++] = nparts - 1; + + Assert(merge_len % 2 == 0); + MemoryContextSwitchTo(target_ctx); + merge_len_ = merge_len; + merge_index_ = (int *)palloc(merge_len * sizeof(int)); + memcpy(merge_index_, merge_index, merge_len * sizeof(int)); + pfree(merge_index); + + MemoryContextSwitchTo(saved_ctx); +} + +void PartitionObjectInternal::Release() { + pax_rel_ = nullptr; + partition_key_ = nullptr; + partition_desc_ = nullptr; + partition_bound_spec_ = 
nullptr; + if (mctx_) { + MemoryContextDelete(mctx_); + mctx_ = nullptr; + } +} + +int PartitionObjectInternal::NumPartitions() const { + Assert(pax_rel_ && partition_key_ && partition_desc_ && mctx_); + return list_length(partition_bound_spec_); +} + +int PartitionObjectInternal::NumPartitionKeys() const { + Assert(pax_rel_ && partition_key_ && partition_desc_ && mctx_); + return get_partition_natts(partition_key_); +} + +int PartitionObjectInternal::FindPartition(TupleTableSlot *slot) { + Datum values[PARTITION_MAX_KEYS]; + bool isnull[PARTITION_MAX_KEYS]; + + Assert(pax_rel_ && partition_key_ && partition_desc_ && mctx_); + PaxFormPartitionKeyDatum(partition_key_, slot, values, isnull); + return get_partition_for_tuple(partition_key_, partition_desc_, values, + isnull); +} + +} // namespace paxc + +namespace pax { +bool PartitionObject::Initialize(Relation pax_rel) { + // FIXME: We MUST catch some types of exceptions and assumes + // the partition should be ignored. Because the partition constraint + // may be broken by: + // 1. rename column name + // 2. change column type + // 3. 
drop one or more columns in the partition keys + CBDB_WRAP_START; + { return stub_.Initialize(pax_rel); } + CBDB_WRAP_END; +} +void PartitionObject::Release() { + CBDB_WRAP_START; + { stub_.Release(); } + CBDB_WRAP_END; +} + +int PartitionObject::FindPartition(TupleTableSlot *slot) { + CBDB_WRAP_START; + { return stub_.FindPartition(slot); } + CBDB_WRAP_END; +} +std::pair PartitionObject::GetMergeListInfo() { + return {stub_.merge_index_, stub_.merge_len_}; +} + +} // namespace pax + +extern "C" { +// CREATE FUNCTION pax_dump_ranges(relid Oid) RETURNS SETOF TEXT AS +// '$libdir/pax', 'PaxPartitionDumpRanges' +// LANGUAGE C STRICT; +// UDF about partition +PG_FUNCTION_INFO_V1(PaxPartitionDumpRanges); +struct PartitionRangeDumpContext { + List *boundspec_list; + MemoryContext mctx; + int index; +}; + +Datum PaxPartitionDumpRanges(PG_FUNCTION_ARGS) { + PartitionRangeDumpContext *ctx; + FuncCallContext *funcctx; + + if (SRF_IS_FIRSTCALL()) { + Oid relid = PG_GETARG_OID(0); + MemoryContext tmp_ctx; + MemoryContext old_ctx; + List *partparams; + List *partboundspecs; + bool ok; + + funcctx = SRF_FIRSTCALL_INIT(); + tmp_ctx = + AllocSetContextCreate(funcctx->multi_call_memory_ctx, + "tmp pax partition ctx", ALLOCSET_DEFAULT_SIZES); + old_ctx = MemoryContextSwitchTo(tmp_ctx); + + ok = paxc::PaxLoadPartitionSpec(relid, &partparams, &partboundspecs); + if (!ok) partboundspecs = nullptr; + + ctx = + (PartitionRangeDumpContext *)palloc(sizeof(PartitionRangeDumpContext)); + ctx->boundspec_list = partboundspecs; + ctx->mctx = tmp_ctx; + ctx->index = 0; + funcctx->user_fctx = (void *)ctx; + MemoryContextSwitchTo(old_ctx); + } + + funcctx = SRF_PERCALL_SETUP(); + ctx = (PartitionRangeDumpContext *)funcctx->user_fctx; + while (ctx->index < list_length(ctx->boundspec_list)) { + StringInfoData str; + char *value_list; + text *range; + PartitionBoundSpec *spec = + castNode(PartitionBoundSpec, list_nth(ctx->boundspec_list, ctx->index)); + ++ctx->index; + + initStringInfo(&str); + 
appendStringInfoString(&str, "from"); + value_list = get_range_partbound_string(spec->lowerdatums); + appendStringInfoString(&str, value_list); + pfree(value_list); + + appendStringInfoString(&str, " to"); + value_list = get_range_partbound_string(spec->upperdatums); + appendStringInfoString(&str, value_list); + pfree(value_list); + + range = cstring_to_text(str.data); + pfree(str.data); + SRF_RETURN_NEXT(funcctx, PointerGetDatum(range)); + } + + MemoryContextDelete(ctx->mctx); + SRF_RETURN_DONE(funcctx); +} +} diff --git a/contrib/pax_storage/src/cpp/access/pax_partition.h b/contrib/pax_storage/src/cpp/access/pax_partition.h new file mode 100644 index 00000000000..2e7ed5ea05e --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/pax_partition.h @@ -0,0 +1,75 @@ +#pragma once + +#include "comm/cbdb_api.h" + +#include + +namespace pax { +class PartitionObject; +} + +struct PartitionRangeExtension { + struct PartitionBoundSpec spec; + List *every; +}; +namespace paxc { + +extern PartitionKey PaxRelationBuildPartitionKey(Relation relation, + List *partparams_list); +extern bool PartitionCheckBounds(PartitionKey key, int nparts, + PartitionBoundSpec **partboundspecs); +extern List *PaxValidatePartitionRanges(Relation relation, PartitionKey key, + List *raw_partbound_list); + +class PartitionObjectInternal { + public: + bool Initialize(Relation pax_rel); + void Release(); + + // Get number of partitions, excluding the default partition + int NumPartitions() const; + int NumPartitionKeys() const; + // -1 if default partition, >=0 leaf partition + int FindPartition(TupleTableSlot *slot); + PartitionKey GetPartitionKey() { return partition_key_; } + PartitionDesc GetPartitionDesc() { return partition_desc_; } + + private: + void InitializeMergeInfo(PartitionKey key, List *partboundspec_list, + MemoryContext tmp_ctx, MemoryContext target_ctx); + + friend class pax::PartitionObject; + Relation pax_rel_ = nullptr; + PartitionKey partition_key_ = nullptr; + PartitionDesc 
partition_desc_ = nullptr; + int *merge_index_ = nullptr; + size_t merge_len_ = 0; + List *partition_bound_spec_ = nullptr; + MemoryContext mctx_ = nullptr; +}; +} // namespace paxc + +namespace pax { +class PartitionObject { + public: + bool Initialize(Relation pax_rel); + void Release(); + + PartitionKey GetPartitionKey() { return stub_.GetPartitionKey(); } + PartitionDesc GetPartitionDesc() { return stub_.GetPartitionDesc(); } + + // Get number of partitions, excluding the default partition + int NumPartitions() const { return stub_.NumPartitions(); } + // Get number of the partition keys + int NumPartitionKeys() const { return stub_.NumPartitionKeys(); } + + // -1 if default partition, >= 0 leaf partition + int FindPartition(TupleTableSlot *slot); + + std::pair GetMergeListInfo(); + + private: + paxc::PartitionObjectInternal stub_; +}; + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/access/pax_scanner.cc b/contrib/pax_storage/src/cpp/access/pax_scanner.cc index 9abd53ade28..3b4054b4bf2 100644 --- a/contrib/pax_storage/src/cpp/access/pax_scanner.cc +++ b/contrib/pax_storage/src/cpp/access/pax_scanner.cc @@ -1,19 +1,147 @@ #include "access/pax_scanner.h" #include "access/pax_access_handle.h" +#include "catalog/pax_aux_table.h" +#include "catalog/pg_pax_tables.h" +#include "comm/guc.h" +#include "comm/pax_memory.h" #include "storage/local_file_system.h" #include "storage/micro_partition.h" #include "storage/micro_partition_iterator.h" +#include "storage/micro_partition_stats.h" #include "storage/orc/orc.h" #include "storage/pax.h" #include "storage/pax_buffer.h" +#include "storage/pax_defined.h" + +#ifdef ENABLE_PLASMA +#include "storage/cache/pax_plasma_cache.h" +#endif + +#ifdef VEC_BUILD +#include "utils/am_vec.h" +#endif + +namespace paxc { +bool IndexUniqueCheck(Relation rel, ItemPointer tid, Snapshot snapshot, + bool * /*all_dead*/) { + paxc::ScanAuxContext context; + HeapTuple tuple; + char block_name[NAMEDATALEN]; + Oid aux_relid; + bool 
exists; + + aux_relid = ::paxc::GetPaxAuxRelid(RelationGetRelid(rel)); + snprintf(block_name, sizeof(block_name), "%u", pax::GetBlockNumber(*tid)); + context.BeginSearchMicroPartition(aux_relid, InvalidOid, snapshot, + AccessShareLock, block_name); + tuple = context.SearchMicroPartitionEntry(); + exists = HeapTupleIsValid(tuple); + context.EndSearchMicroPartition(AccessShareLock); + return exists; +} +} // namespace paxc namespace pax { +PaxIndexScanDesc::PaxIndexScanDesc(Relation rel) : base_{.rel = rel} { + Assert(rel); + Assert(&base_ == reinterpret_cast(this)); + rel_path_ = cbdb::BuildPaxDirectoryPath(rel->rd_node, rel->rd_backend); +} + +PaxIndexScanDesc::~PaxIndexScanDesc() { + if (reader_) { + reader_->Close(); + PAX_DELETE(reader_); + } +} + +bool PaxIndexScanDesc::FetchTuple(ItemPointer tid, Snapshot snapshot, + TupleTableSlot *slot, bool *call_again, + bool *all_dead) { + BlockNumber block = pax::GetBlockNumber(*tid); + if (block != current_block_ || !reader_) { + if (!OpenMicroPartition(block, snapshot)) return false; + } + + Assert(current_block_ == block && reader_); + if (call_again) *call_again = false; + if (all_dead) *all_dead = false; + + auto ok = reader_->GetTuple(slot, pax::GetTupleOffset(*tid)); + if (ok) { + SetBlockNumber(&slot->tts_tid, block); + ExecStoreVirtualTuple(slot); + } + + return ok; +} + +bool PaxIndexScanDesc::OpenMicroPartition(BlockNumber block, + Snapshot snapshot) { + bool ok; + + Assert(block != current_block_); + + ok = cbdb::IsMicroPartitionVisible(base_.rel, block, snapshot); + if (ok) { + MicroPartitionReader::ReaderOptions options; + + auto block_name = std::to_string(block); + auto file_name = cbdb::BuildPaxFilePath(rel_path_, block_name); + options.block_id = block_name; + auto file = Singleton::GetInstance()->Open( + file_name, fs::kReadMode); + auto reader = PAX_NEW(file); + reader->Open(options); + if (reader_) { + reader_->Close(); + PAX_DELETE(reader_); + } + reader_ = reader; + current_block_ = block; + } + + 
return ok; +} + +bool PaxScanDesc::BitmapNextBlock(struct TBMIterateResult *tbmres) { + cindex_ = 0; + if (!index_desc_) { + index_desc_ = PAX_NEW(rs_base_.rs_rd); + } + return true; +} + +bool PaxScanDesc::BitmapNextTuple(struct TBMIterateResult *tbmres, + TupleTableSlot *slot) { + ItemPointerData tid; + if (tbmres->ntuples < 0) { + // lossy bitmap. The maximum value of the last 16 bits in CTID is + // 0x7FFF + 1, i.e. 0x8000. See layout of ItemPointerData in PAX + if (cindex_ > 0X8000) elog(ERROR, "unexpected offset in pax"); + + ItemPointerSet(&tid, tbmres->blockno, cindex_); + } else if (cindex_ < tbmres->ntuples) { + // The maximum value of the last 16 bits in CTID is 0x7FFF + 1, + // i.e. 0x8000. See layout of ItemPointerData in PAX + if (tbmres->offsets[cindex_] > 0X8000) + elog(ERROR, "unexpected offset in pax"); + + ItemPointerSet(&tid, tbmres->blockno, tbmres->offsets[cindex_]); + } else { + return false; + } + ++cindex_; + return index_desc_->FetchTuple(&tid, rs_base_.rs_snapshot, slot, nullptr, + nullptr); +} + TableScanDesc PaxScanDesc::BeginScan(Relation relation, Snapshot snapshot, - int nkeys, struct ScanKeyData *key, + int nkeys, struct ScanKeyData * /*key*/, ParallelTableScanDesc pscan, uint32 flags, - PaxFilter *filter) { + PaxFilter *filter, bool build_bitmap) { PaxScanDesc *desc; MemoryContext old_ctx; TableReader::ReaderOptions reader_options{}; @@ -22,7 +150,7 @@ TableScanDesc PaxScanDesc::BeginScan(Relation relation, Snapshot snapshot, offsetof(PaxScanDesc, rs_base_) == 0, "rs_base should be the first field and aligned to the object address"); - desc = new PaxScanDesc(); + desc = PAX_NEW(); desc->memory_context_ = cbdb::AllocSetCtxCreate( CurrentMemoryContext, "Pax Storage", PAX_ALLOCSET_DEFAULT_SIZES); @@ -33,157 +161,224 @@ TableScanDesc PaxScanDesc::BeginScan(Relation relation, Snapshot snapshot, desc->rs_base_.rs_nkeys = nkeys; desc->rs_base_.rs_flags = flags; desc->rs_base_.rs_parallel = pscan; - desc->key_ = key; - desc->reused_buffer_ 
= new DataBuffer(32 * 1024 * 1024); // 32mb + desc->reused_buffer_ = PAX_NEW>(pax_scan_reuse_buffer_size); desc->filter_ = filter; + if (!desc->filter_) { + desc->filter_ = PAX_NEW(); + } + + if (!desc->filter_->GetColumnProjection().first) { + auto natts = cbdb::RelationGetAttributesNumber(relation); + auto cols = PAX_NEW_ARRAY(natts); + memset(cols, true, natts); + desc->filter_->SetColumnProjection(cols, natts); + } + #ifdef VEC_BUILD - if (flags & (1 << 12)) { - desc->vec_adapter_ = new VecAdapter(cbdb::RelationGetTupleDesc(relation)); + if (flags & SO_TYPE_VECTOR) { + desc->vec_adapter_ = + PAX_NEW(cbdb::RelationGetTupleDesc(relation), build_bitmap); reader_options.is_vec = true; reader_options.adapter = desc->vec_adapter_; } -#endif +#endif // VEC_BUILD + +#ifdef ENABLE_PLASMA + if (pax_enable_plasma_in_mem) { + std::string plasma_socket_path = + std::string(desc->plasma_socket_path_prefix_); + plasma_socket_path.append(std::to_string(PostPortNumber)); + plasma_socket_path.append("\0"); + PaxPlasmaCache::CacheOptions cache_options; + cache_options.domain_socket = plasma_socket_path; + cache_options.memory_quota = 0; + cache_options.waitting_ms = 0; + + desc->pax_cache_ = PAX_NEW(std::move(cache_options)); + auto status = desc->pax_cache_->Initialize(); + if (!status.Ok()) { + elog(WARNING, "Plasma cache client init failed, message: %s", + status.Error().c_str()); + PAX_DELETE(desc->pax_cache_); + desc->pax_cache_ = nullptr; + } + + reader_options.pax_cache = desc->pax_cache_; + } - // init shared memory - cbdb::InitCommandResource(); +#endif // ENABLE_PLASMA old_ctx = MemoryContextSwitchTo(desc->memory_context_); // build reader - reader_options.build_bitmap = true; + reader_options.build_bitmap = build_bitmap; reader_options.reused_buffer = desc->reused_buffer_; reader_options.rel_oid = desc->rs_base_.rs_rd->rd_id; reader_options.filter = filter; auto iter = MicroPartitionInfoIterator::New(relation, snapshot); if (filter && filter->HasMicroPartitionFilter()) 
{ - auto wrap = new FilterIterator( + auto wrap = PAX_NEW>( std::move(iter), [filter, relation](const auto &x) { - return filter->TestMicroPartitionScan(x.GetStats(), - RelationGetDescr(relation)); + MicroPartitionStatsProvider provider(x.GetStats()); + auto ok = filter->TestScan(provider, RelationGetDescr(relation), + PaxFilterStatisticsKind::kFile); + return ok; }); iter = std::unique_ptr>(wrap); } - desc->reader_ = new TableReader(std::move(iter), reader_options); + desc->reader_ = PAX_NEW(std::move(iter), reader_options); desc->reader_->Open(); MemoryContextSwitchTo(old_ctx); return &desc->rs_base_; } -void PaxScanDesc::EndScan(TableScanDesc scan) { - PaxScanDesc *desc = ScanToDesc(scan); +void PaxScanDesc::EndScan() { + if (pax_enable_debug && filter_) { + filter_->LogStatistics(); + } - Assert(desc->reader_); - desc->reader_->Close(); + Assert(reader_); + reader_->Close(); - delete desc->reused_buffer_; - delete desc->reader_; - delete desc->filter_; + PAX_DELETE(reused_buffer_); + PAX_DELETE(reader_); + PAX_DELETE(filter_); #ifdef VEC_BUILD - delete desc->vec_adapter_; + PAX_DELETE(vec_adapter_); #endif + +#ifdef ENABLE_PLASMA + if (pax_cache_) { + pax_cache_->Destroy(); + PAX_DELETE(pax_cache_); + } +#endif + + PAX_DELETE(index_desc_); + // TODO(jiaqizho): please double check with abort transaction @gongxun - Assert(desc->memory_context_); - cbdb::MemoryCtxDelete(desc->memory_context_); - delete desc; + Assert(memory_context_); + cbdb::MemoryCtxDelete(memory_context_); + auto self = this; + PAX_DELETE(self); } TableScanDesc PaxScanDesc::BeginScanExtractColumns( - Relation rel, Snapshot snapshot, ParallelTableScanDesc parallel_scan, - List *targetlist, List *qual, uint32 flags) { + Relation rel, Snapshot snapshot, int /*nkeys*/, + struct ScanKeyData * /*key*/, ParallelTableScanDesc parallel_scan, + struct PlanState *ps, uint32 flags) { TableScanDesc paxscan; PaxFilter *filter; + List *targetlist = ps->plan->targetlist; + List *qual = ps->plan->qual; auto 
natts = cbdb::RelationGetAttributesNumber(rel); bool *cols; bool found = false; + bool build_bitmap = true; + PaxcExtractcolumnContext extract_column; + + filter = PAX_NEW(); - filter = new PaxFilter(); + Assert(natts >= 0); - cols = new bool[natts]; + cols = PAX_NEW_ARRAY(natts); memset(cols, false, natts); + extract_column.cols = cols; + extract_column.natts = natts; + found = cbdb::ExtractcolumnsFromNode(reinterpret_cast(targetlist), - cols, natts); + &extract_column); found = cbdb::ExtractcolumnsFromNode(reinterpret_cast(qual), cols, natts) || found; + build_bitmap = cbdb::IsSystemAttrNumExist(&extract_column, + SelfItemPointerAttributeNumber); // In some cases (for example, count(*)), targetlist and qual may be null, // extractcolumns_walker will return immediately, so no columns are specified. // We always scan the first column. - if (!found) cols[0] = true; + if (!found && !build_bitmap && natts > 0) cols[0] = true; // The `cols` life cycle will be bound to `PaxFilter` filter->SetColumnProjection(cols, natts); - { + if (pax_enable_filter) { ScanKey scan_keys = nullptr; int n_scan_keys = 0; auto ok = pax::BuildScanKeys(rel, qual, false, &scan_keys, &n_scan_keys); if (ok) filter->SetScanKeys(scan_keys, n_scan_keys); + + if (gp_enable_predicate_pushdown +#ifdef VEC_BUILD + && !(flags & SO_TYPE_VECTOR) +#endif + ) + filter->BuildExecutionFilterForColumns(rel, ps); } - paxscan = BeginScan(rel, snapshot, 0, nullptr, parallel_scan, flags, filter); + paxscan = BeginScan(rel, snapshot, 0, nullptr, parallel_scan, flags, filter, + build_bitmap); return paxscan; } // FIXME: shall we take these parameters into account? 
-void PaxScanDesc::ReScan(TableScanDesc scan) { - PaxScanDesc *desc = ScanToDesc(scan); +void PaxScanDesc::ReScan(ScanKey /*key*/, bool /*set_params*/, + bool /*allow_strat*/, bool /*allow_sync*/, + bool /*allow_pagemode*/) { MemoryContext old_ctx; - Assert(desc && desc->reader_); + Assert(reader_); - old_ctx = MemoryContextSwitchTo(desc->memory_context_); - desc->reader_->ReOpen(); + old_ctx = MemoryContextSwitchTo(memory_context_); + reader_->ReOpen(); MemoryContextSwitchTo(old_ctx); } -bool PaxScanDesc::ScanGetNextSlot(TableScanDesc scan, TupleTableSlot *slot) { - PaxScanDesc *desc = ScanToDesc(scan); +bool PaxScanDesc::GetNextSlot(TupleTableSlot *slot) { MemoryContext old_ctx; bool ok = false; - CTupleSlot cslot(slot); - old_ctx = MemoryContextSwitchTo(desc->memory_context_); + old_ctx = MemoryContextSwitchTo(memory_context_); - ok = desc->reader_->ReadTuple(&cslot); + Assert(reader_); + ok = reader_->ReadTuple(slot); MemoryContextSwitchTo(old_ctx); return ok; } -bool PaxScanDesc::ScanAnalyzeNextBlock(TableScanDesc scan, - BlockNumber blockno) { - PaxScanDesc *desc = ScanToDesc(scan); - desc->target_tuple_id_ = blockno; - +bool PaxScanDesc::ScanAnalyzeNextBlock(BlockNumber blockno, + BufferAccessStrategy /*bstrategy*/) { + target_tuple_id_ = blockno; return true; } -bool PaxScanDesc::ScanAnalyzeNextTuple(TableScanDesc scan, double *liverows, - const double *deadrows, +bool PaxScanDesc::ScanAnalyzeNextTuple(TransactionId /*oldest_xmin*/, + double *liverows, + const double * /* deadrows */, TupleTableSlot *slot) { - PaxScanDesc *desc = ScanToDesc(scan); MemoryContext old_ctx; bool ok = false; - old_ctx = MemoryContextSwitchTo(desc->memory_context_); - Assert(*deadrows == 0); // not dead rows in pax latest snapshot - while (desc->next_tuple_id_ < desc->target_tuple_id_) { - ok = PaxScanDesc::ScanGetNextSlot(scan, slot); + old_ctx = MemoryContextSwitchTo(memory_context_); + while (next_tuple_id_ < target_tuple_id_) { + ok = GetNextSlot(slot); if (!ok) break; - 
desc->next_tuple_id_++; + next_tuple_id_++; + } + if (next_tuple_id_ == target_tuple_id_) { + ok = GetNextSlot(slot); + next_tuple_id_++; + if (ok) *liverows += 1; } MemoryContextSwitchTo(old_ctx); - if (ok) *liverows += 1; return ok; } -bool PaxScanDesc::ScanSampleNextBlock(TableScanDesc scan, - SampleScanState *scanstate) { - PaxScanDesc *desc = ScanToDesc(scan); +bool PaxScanDesc::ScanSampleNextBlock(SampleScanState *scanstate) { MemoryContext old_ctx; TsmRoutine *tsm = scanstate->tsmroutine; BlockNumber blockno = 0; @@ -193,39 +388,36 @@ bool PaxScanDesc::ScanSampleNextBlock(TableScanDesc scan, double allvisfrac = 0; bool ok = false; - old_ctx = MemoryContextSwitchTo(desc->memory_context_); + old_ctx = MemoryContextSwitchTo(memory_context_); - if (desc->total_tuples_ == 0) { - paxc::PaxAccessMethod::EstimateRelSize(scan->rs_rd, &attrwidths, &pages, + if (total_tuples_ == 0) { + paxc::PaxAccessMethod::EstimateRelSize(rs_base_.rs_rd, &attrwidths, &pages, &total_tuples, &allvisfrac); - desc->total_tuples_ = total_tuples; + total_tuples_ = total_tuples; } if (tsm->NextSampleBlock) - blockno = tsm->NextSampleBlock(scanstate, desc->total_tuples_); + blockno = tsm->NextSampleBlock(scanstate, total_tuples_); else - blockno = system_nextsampleblock(scanstate, desc->total_tuples_); + blockno = system_nextsampleblock(scanstate, total_tuples_); ok = BlockNumberIsValid(blockno); - if (ok) { - desc->fetch_tuple_id_ = blockno; - } + if (ok) fetch_tuple_id_ = blockno; MemoryContextSwitchTo(old_ctx); return ok; } -bool PaxScanDesc::ScanSampleNextTuple(TableScanDesc scan, +bool PaxScanDesc::ScanSampleNextTuple(SampleScanState * /*scanstate*/, TupleTableSlot *slot) { - PaxScanDesc *desc = ScanToDesc(scan); MemoryContext old_ctx; bool ok = false; - old_ctx = MemoryContextSwitchTo(desc->memory_context_); - while (desc->next_tuple_id_ < desc->fetch_tuple_id_) { - ok = PaxScanDesc::ScanGetNextSlot(scan, slot); + old_ctx = MemoryContextSwitchTo(memory_context_); + while 
(next_tuple_id_ < fetch_tuple_id_) { + ok = GetNextSlot(slot); if (!ok) break; - desc->next_tuple_id_++; + next_tuple_id_++; } MemoryContextSwitchTo(old_ctx); return ok; diff --git a/contrib/pax_storage/src/cpp/access/pax_scanner.h b/contrib/pax_storage/src/cpp/access/pax_scanner.h index f06ab6c9fb8..33f6754855c 100644 --- a/contrib/pax_storage/src/cpp/access/pax_scanner.h +++ b/contrib/pax_storage/src/cpp/access/pax_scanner.h @@ -2,52 +2,84 @@ #include "comm/cbdb_api.h" +#include + #include "storage/pax.h" #include "storage/pax_filter.h" #ifdef VEC_BUILD #include "storage/vec/pax_vec_adapter.h" #endif + +namespace paxc { +bool IndexUniqueCheck(Relation rel, ItemPointer tid, Snapshot snapshot, + bool *all_dead); +} + namespace pax { +class PaxIndexScanDesc final { + public: + explicit PaxIndexScanDesc(Relation rel); + ~PaxIndexScanDesc(); + bool FetchTuple(ItemPointer tid, Snapshot snapshot, TupleTableSlot *slot, + bool *call_again, bool *all_dead); + inline IndexFetchTableData *ToBase() { return &base_; } + static inline PaxIndexScanDesc *FromBase(IndexFetchTableData *base) { + return reinterpret_cast(base); + } + + private: + bool OpenMicroPartition(BlockNumber block, Snapshot snapshot); + + IndexFetchTableData base_; + BlockNumber current_block_ = InvalidBlockNumber; + MicroPartitionReader *reader_ = nullptr; + std::string rel_path_; +}; class PaxScanDesc { public: static TableScanDesc BeginScan(Relation relation, Snapshot snapshot, int nkeys, struct ScanKeyData *key, ParallelTableScanDesc pscan, uint32 flags, - PaxFilter *filter); - - static void ReScan(TableScanDesc scan); - static void EndScan(TableScanDesc scan); + PaxFilter *filter, bool build_bitmap); static TableScanDesc BeginScanExtractColumns( - Relation rel, Snapshot snapshot, ParallelTableScanDesc parallel_scan, - List *targetlist, List *qual, uint32 flags); + Relation rel, Snapshot snapshot, int nkeys, struct ScanKeyData *key, + ParallelTableScanDesc parallel_scan, struct PlanState *ps, uint32 
flags); - static bool ScanGetNextSlot(TableScanDesc scan, TupleTableSlot *slot); + void EndScan(); + void ReScan(ScanKey key, bool set_params, bool allow_strat, bool allow_sync, + bool allow_pagemode); - static bool ScanAnalyzeNextBlock(TableScanDesc scan, BlockNumber blockno); - static bool ScanAnalyzeNextTuple(TableScanDesc scan, double *liverows, - const double *deadrows, - TupleTableSlot *slot); + bool GetNextSlot(TupleTableSlot *slot); - static bool ScanSampleNextBlock(TableScanDesc scan, - SampleScanState *scanstate); + bool ScanAnalyzeNextBlock(BlockNumber blockno, + BufferAccessStrategy bstrategy); + bool ScanAnalyzeNextTuple(TransactionId oldest_xmin, double *liverows, + const double *deadrows, TupleTableSlot *slot); - static bool ScanSampleNextTuple(TableScanDesc scan, TupleTableSlot *slot); + bool ScanSampleNextBlock(SampleScanState *scanstate); - ~PaxScanDesc() = default; + bool ScanSampleNextTuple(SampleScanState *scanstate, TupleTableSlot *slot); - private: - PaxScanDesc() = default; + bool BitmapNextBlock(struct TBMIterateResult *tbmres); + bool BitmapNextTuple(struct TBMIterateResult *tbmres, TupleTableSlot *slot); + + ~PaxScanDesc() = default; - static inline PaxScanDesc *ScanToDesc(TableScanDesc scan) { + static inline PaxScanDesc *ToDesc(TableScanDesc scan) { auto desc = reinterpret_cast(scan); return desc; } + private: + template + friend T *PAX_NEW(Args &&...args); + PaxScanDesc() = default; + private: TableScanDescData rs_base_{}; - const ScanKeyData *key_ = nullptr; + TableReader *reader_ = nullptr; DataBuffer *reused_buffer_ = nullptr; @@ -67,6 +99,15 @@ class PaxScanDesc { #ifdef VEC_BUILD VecAdapter *vec_adapter_ = nullptr; #endif + +#ifdef ENABLE_PLASMA + const std::string plasma_socket_path_prefix_ = "/tmp/.s.plasma."; + PaxCache *pax_cache_ = nullptr; +#endif + + // used only by bitmap index scan + PaxIndexScanDesc *index_desc_ = nullptr; + int cindex_ = 0; }; // class PaxScanDesc } // namespace pax diff --git 
a/contrib/pax_storage/src/cpp/access/pax_updater.cc b/contrib/pax_storage/src/cpp/access/pax_updater.cc index e5f79c23ee2..3fbb8787c54 100644 --- a/contrib/pax_storage/src/cpp/access/pax_updater.cc +++ b/contrib/pax_storage/src/cpp/access/pax_updater.cc @@ -8,19 +8,29 @@ namespace pax { TM_Result CPaxUpdater::UpdateTuple( const Relation relation, const ItemPointer otid, TupleTableSlot *slot, const CommandId cid, const Snapshot snapshot, const Snapshot /*crosscheck*/, - const bool /*wait*/, TM_FailureData * /*tmfd*/, - LockTupleMode * /*lockmode*/, bool * /*update_indexes*/) { + const bool /*wait*/, TM_FailureData * tmfd, + LockTupleMode * lockmode, bool *update_indexes) { TM_Result result; - CPaxDeleter *deleter = - CPaxDmlStateLocal::Instance()->GetDeleter(relation, snapshot); + + auto dml_state = CPaxDmlStateLocal::Instance(); + auto deleter = dml_state->GetDeleter(relation, snapshot); + auto inserter = dml_state->GetInserter(relation); + Assert(deleter != nullptr); - CPaxInserter *inserter = CPaxDmlStateLocal::Instance()->GetInserter(relation); Assert(inserter != nullptr); + *lockmode = LockTupleExclusive; result = deleter->MarkDelete(otid); - // FIXME(gongxun): check result and return TM_SelfModified if needed - inserter->InsertTuple(relation, slot, cid, 0, nullptr); + if (result == TM_Ok) { + inserter->InsertTuple(relation, slot, cid, 0, nullptr); + *update_indexes = true; + } else { + // FIXME: set tmfd correctly. 
+ // FYI, ao ignores both tmfd and lockmode + tmfd->ctid = *otid; + *update_indexes = false; + } // TODO(gongxun): update pgstat info return result; } diff --git a/contrib/pax_storage/src/cpp/access/paxc_gram.y b/contrib/pax_storage/src/cpp/access/paxc_gram.y new file mode 100644 index 00000000000..84ca498fd99 --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/paxc_gram.y @@ -0,0 +1,575 @@ +%{ +#include "postgres.h" + + +#include "nodes/pg_list.h" +#include "parser/parser.h" +#include "parser/parse_type.h" +#include "parser/scanner.h" +#include "parser/scansup.h" +#include "utils/builtins.h" +#include "utils/datetime.h" + +#include "access/paxc_scanner.h" + +/* Location tracking support --- simpler than bison's default */ +#define YYLLOC_DEFAULT(Current, Rhs, N) \ + do { \ + if (N) \ + (Current) = (Rhs)[1]; \ + else \ + (Current) = (Rhs)[0]; \ + } while (0) + +#define parser_errposition(pos) scanner_errposition(pos, yyscanner) +#define parser_yyerror(msg) scanner_yyerror(yyscanner, msg) + +/* + * Bison doesn't allocate anything that needs to live across parser calls, + * so we can easily have it use palloc instead of malloc. This prevents + * memory leaks if we error out during parsing. Note this only works with + * bison >= 2.0. However, in bison 1.875 the default is to use alloca() + * if possible, so there's not really much problem anyhow, at least if + * you're building with gcc. 
+ */ +#define YYMALLOC palloc +#define YYFREE pfree + +static void paxc_yyerror(core_yyscan_t yyscanner, const char *message); +static int paxc_yylex(core_yyscan_t yyscanner); +static int paxc_scanner_errposition(int location); +static List *paxc_result; + +%} + +/* %pure-parser */ +%expect 0 +%name-prefix="paxc_yy" +%locations +%parse-param {core_yyscan_t yyscanner} +%lex-param {core_yyscan_t yyscanner} + +%union +{ + core_YYSTYPE core_yystype; + /* these fields must match core_YYSTYPE: */ + int ival; + char *str; + const char *keyword; + + bool boolean; + List *list; + Node *node; + TypeName *typnam; + PartitionElem *partelem; + PartitionSpec *partspec; + PartitionBoundSpec *partboundspec; +} + +/* %type top_level_stmt */ +%type partition_by part_params any_name opt_collate attrs opt_qualified_name +%type part_elem +%type ColId attr_name + +// FIXME: types for partition ranges +//%type partition_ranges expr_list opt_type_modifiers +//%type partition_range +//%type AexprConst a_expr c_expr +//%type Numeric opt_float ConstTypename ConstDatetime ConstInterval ConstCharacter CharacterWithLength CharacterWithoutLength ConstBit BitWithLength BitWithoutLength +//%type opt_varying opt_timezone +//%type opt_interval interval_second +//%type Sconst character +//%type Iconst + +%token IDENT +//%token FCONST SCONST BCONST XCONST +//%token ICONST + +%token COLLATE +//%token TRUE_P FALSE_P HOUR_P YEAR_P NULL_P MONTH_P TO VARYING VARCHAR TIMESTAMP BIT TIME INTERVAL DAY_P MINUTE_P SECOND_P CHARACTER NATIONAL NCHAR CHAR_P ZONE INT_P INTEGER SMALLINT BIGINT REAL FLOAT_P DOUBLE_P PRECISION DECIMAL_P DEC NUMERIC BOOLEAN_P FROM + +%token WITH_LA WITHOUT_LA + + +%% + +top_level_stmt: + partition_by { paxc_result = $1; } +// | partition_ranges { paxc_result = $1; } + ; + +partition_by: part_params { $$ = $1; } + ; +part_params: + part_elem { $$ = list_make1($1); } + | part_params ',' part_elem { $$ = lappend($1, $3); } + ; + +part_elem: ColId opt_collate opt_qualified_name + { + 
PartitionElem *n = makeNode(PartitionElem); + + n->name = $1; + n->expr = NULL; + n->collation = $2; + n->opclass = $3; + n->location = @1; + $$ = n; + } +/* + | func_expr_windowless opt_collate opt_qualified_name + { + PartitionElem *n = makeNode(PartitionElem); + + n->name = NULL; + n->expr = $1; + n->collation = $2; + n->opclass = $3; + n->location = @1; + $$ = n; + } + | '(' a_expr ')' opt_collate opt_qualified_name + { + PartitionElem *n = makeNode(PartitionElem); + + n->name = NULL; + n->expr = $2; + n->collation = $4; + n->opclass = $5; + n->location = @1; + $$ = n; + } +*/ + ; + +/* Column identifier --- names that can be column, table, etc names. + */ +ColId: IDENT { $$ = $1; } + ; +opt_collate: COLLATE any_name { $$ = $2; } + | /*EMPTY*/ { $$ = NIL; } + ; + +any_name: + ColId { $$ = list_make1(makeString($1)); } + | ColId attrs { $$ = lcons(makeString($1), $2); } + ; + +attrs: '.' attr_name { $$ = list_make1(makeString($2)); } + | attrs '.' attr_name { $$ = lappend($1, makeString($3)); } + ; + +attr_name: IDENT { $$ = $1; } + ; + +/* opclass */ +opt_qualified_name: any_name { $$ = $1; } + | /*EMPTY*/ { $$ = NIL; } + ; + +//partition_ranges: partition_ranges ',' partition_range { $$ = lappend($1, $3); } +// | partition_range { $$ = list_make1($1); } +// ; +// +//partition_range: FROM '(' expr_list ')' TO '(' expr_list ')' +// { +// PartitionBoundSpec *n = makeNode(PartitionBoundSpec); +// +// n->strategy = PARTITION_STRATEGY_RANGE; +// n->is_default = false; +// n->lowerdatums = $3; +// n->upperdatums = $7; +// +// $$ = n; +// } +// ; +// +//expr_list: a_expr { $$ = list_make1($1); } +// | expr_list ',' a_expr { $$ = lappend($1, $3); } +// ; +// +//a_expr: c_expr { $$ = $1; } +// ; +//c_expr: AexprConst { $$ = $1; } +// ; +// +///* +// * Constants +// */ +//AexprConst: Iconst { $$ = makeIntConst($1, @1); } +// | FCONST { $$ = makeFloatConst($1, @1); } +// | Sconst { $$ = makeStringConst($1, @1); } +// | BCONST { $$ = makeBitStringConst($1, @1); } +// | 
XCONST +// { +// /* This is a bit constant per SQL99: +// * Without Feature F511, "BIT data type", +// * a shall not be a +// * or a . +// */ +// $$ = makeBitStringConst($1, @1); +// } +// | ConstTypename Sconst { $$ = makeStringConstCast($2, @2, $1); } +// | ConstInterval Sconst opt_interval +// { +// TypeName *t = $1; +// +// t->typmods = $3; +// $$ = makeStringConstCast($2, @2, t); +// } +// | ConstInterval '(' Iconst ')' Sconst +// { +// TypeName *t = $1; +// +// t->typmods = list_make2(makeIntConst(INTERVAL_FULL_RANGE, -1), +// makeIntConst($3, @3)); +// $$ = makeStringConstCast($5, @5, t); +// } +// | TRUE_P { $$ = makeBoolAConst(true, @1); } +// | FALSE_P { $$ = makeBoolAConst(false, @1); } +// | NULL_P { $$ = makeNullAConst(@1); } +// ; +// +//Iconst: ICONST { $$ = $1; }; +//Sconst: SCONST { $$ = $1; }; +// +//ConstTypename: +// Numeric { $$ = $1; } +// | ConstBit { $$ = $1; } +// | ConstCharacter { $$ = $1; } +// | ConstDatetime { $$ = $1; } +// ; +// +///* ConstBit is like Bit except "BIT" defaults to unspecified length */ +///* See notes for ConstCharacter, which addresses same issue for "CHAR" */ +//ConstBit: BitWithLength { $$ = $1; } +// | BitWithoutLength +// { +// $$ = $1; +// $$->typmods = NIL; +// } +// ; +// +//BitWithLength: BIT opt_varying '(' expr_list ')' +// { +// char *typname; +// +// typname = $2 ? "varbit" : "bit"; +// $$ = SystemTypeName(typname); +// $$->typmods = $4; +// $$->location = @1; +// } +// ; +// +//BitWithoutLength: BIT opt_varying +// { +// /* bit defaults to bit(1), varbit to no limit */ +// if ($2) +// { +// $$ = SystemTypeName("varbit"); +// } +// else +// { +// $$ = SystemTypeName("bit"); +// $$->typmods = list_make1(makeIntConst(1, -1)); +// } +// $$->location = @1; +// } +// ; +// +//ConstCharacter: CharacterWithLength +// { +// $$ = $1; +// } +// | CharacterWithoutLength +// { +// /* Length was not specified so allow to be unrestricted. 
+// * This handles problems with fixed-length (bpchar) strings +// * which in column definitions must default to a length +// * of one, but should not be constrained if the length +// * was not specified. +// */ +// $$ = $1; +// $$->typmods = NIL; +// } +// ; +// +//CharacterWithLength: character '(' Iconst ')' +// { +// $$ = SystemTypeName($1); +// $$->typmods = list_make1(makeIntConst($3, @3)); +// $$->location = @1; +// } +// ; +// +//CharacterWithoutLength: character +// { +// $$ = SystemTypeName($1); +// /* char defaults to char(1), varchar to no limit */ +// if (strcmp($1, "bpchar") == 0) +// $$->typmods = list_make1(makeIntConst(1, -1)); +// $$->location = @1; +// } +// ; +// +//character: CHARACTER opt_varying { $$ = $2 ? "varchar": "bpchar"; } +// | CHAR_P opt_varying { $$ = $2 ? "varchar": "bpchar"; } +// | VARCHAR { $$ = "varchar"; } +// | NATIONAL CHARACTER opt_varying { $$ = $3 ? "varchar": "bpchar"; } +// | NATIONAL CHAR_P opt_varying { $$ = $3 ? "varchar": "bpchar"; } +// | NCHAR opt_varying { $$ = $2 ? 
"varchar": "bpchar"; } +// ; +// +//opt_varying: VARYING { $$ = true; } +// | /*EMPTY*/ { $$ = false; } +// ; +// +///* +// * SQL date/time types +// */ +//ConstDatetime: +// TIMESTAMP '(' Iconst ')' opt_timezone +// { +// if ($5) +// $$ = SystemTypeName("timestamptz"); +// else +// $$ = SystemTypeName("timestamp"); +// $$->typmods = list_make1(makeIntConst($3, @3)); +// $$->location = @1; +// } +// | TIMESTAMP opt_timezone +// { +// if ($2) +// $$ = SystemTypeName("timestamptz"); +// else +// $$ = SystemTypeName("timestamp"); +// $$->location = @1; +// } +// | TIME '(' Iconst ')' opt_timezone +// { +// if ($5) +// $$ = SystemTypeName("timetz"); +// else +// $$ = SystemTypeName("time"); +// $$->typmods = list_make1(makeIntConst($3, @3)); +// $$->location = @1; +// } +// | TIME opt_timezone +// { +// if ($2) +// $$ = SystemTypeName("timetz"); +// else +// $$ = SystemTypeName("time"); +// $$->location = @1; +// } +// ; +// +//ConstInterval: INTERVAL +// { +// $$ = SystemTypeName("interval"); +// $$->location = @1; +// } +// ; +// +//opt_timezone: WITH_LA TIME ZONE { $$ = true; } +// | WITHOUT_LA TIME ZONE { $$ = false; } +// | /*EMPTY*/ { $$ = false; } +// ; +// +//opt_interval: +// YEAR_P { $$ = list_make1(makeIntConst(INTERVAL_MASK(YEAR), @1)); } +// | MONTH_P { $$ = list_make1(makeIntConst(INTERVAL_MASK(MONTH), @1)); } +// | DAY_P { $$ = list_make1(makeIntConst(INTERVAL_MASK(DAY), @1)); } +// | HOUR_P { $$ = list_make1(makeIntConst(INTERVAL_MASK(HOUR), @1)); } +// | MINUTE_P { $$ = list_make1(makeIntConst(INTERVAL_MASK(MINUTE), @1)); } +// | interval_second { $$ = $1; } +// | YEAR_P TO MONTH_P +// { +// $$ = list_make1(makeIntConst(INTERVAL_MASK(YEAR) | +// INTERVAL_MASK(MONTH), @1)); +// } +// | DAY_P TO HOUR_P +// { +// $$ = list_make1(makeIntConst(INTERVAL_MASK(DAY) | +// INTERVAL_MASK(HOUR), @1)); +// } +// | DAY_P TO MINUTE_P +// { +// $$ = list_make1(makeIntConst(INTERVAL_MASK(DAY) | +// INTERVAL_MASK(HOUR) | +// INTERVAL_MASK(MINUTE), @1)); +// } +// | 
DAY_P TO interval_second +// { +// $$ = $3; +// linitial($$) = makeIntConst(INTERVAL_MASK(DAY) | +// INTERVAL_MASK(HOUR) | +// INTERVAL_MASK(MINUTE) | +// INTERVAL_MASK(SECOND), @1); +// } +// | HOUR_P TO MINUTE_P +// { +// $$ = list_make1(makeIntConst(INTERVAL_MASK(HOUR) | +// INTERVAL_MASK(MINUTE), @1)); +// } +// | HOUR_P TO interval_second +// { +// $$ = $3; +// linitial($$) = makeIntConst(INTERVAL_MASK(HOUR) | +// INTERVAL_MASK(MINUTE) | +// INTERVAL_MASK(SECOND), @1); +// } +// | MINUTE_P TO interval_second +// { +// $$ = $3; +// linitial($$) = makeIntConst(INTERVAL_MASK(MINUTE) | +// INTERVAL_MASK(SECOND), @1); +// } +// | /*EMPTY*/ { $$ = NIL; } +// ; +// +//interval_second: +// SECOND_P +// { +// $$ = list_make1(makeIntConst(INTERVAL_MASK(SECOND), @1)); +// } +// | SECOND_P '(' Iconst ')' +// { +// $$ = list_make2(makeIntConst(INTERVAL_MASK(SECOND), @1), +// makeIntConst($3, @3)); +// } +// ; +// +//opt_type_modifiers: '(' expr_list ')' { $$ = $2; } +// | /* EMPTY */ { $$ = NIL; } +// ; +// +///* +// * SQL numeric data types +// */ +//Numeric: +// INT_P +// { +// $$ = SystemTypeName("int4"); +// $$->location = @1; +// } +// | INTEGER +// { +// $$ = SystemTypeName("int4"); +// $$->location = @1; +// } +// | SMALLINT +// { +// $$ = SystemTypeName("int2"); +// $$->location = @1; +// } +// | BIGINT +// { +// $$ = SystemTypeName("int8"); +// $$->location = @1; +// } +// | REAL +// { +// $$ = SystemTypeName("float4"); +// $$->location = @1; +// } +// | FLOAT_P opt_float +// { +// $$ = $2; +// $$->location = @1; +// } +// | DOUBLE_P PRECISION +// { +// $$ = SystemTypeName("float8"); +// $$->location = @1; +// } +// | DECIMAL_P opt_type_modifiers +// { +// $$ = SystemTypeName("numeric"); +// $$->typmods = $2; +// $$->location = @1; +// } +// | DEC opt_type_modifiers +// { +// $$ = SystemTypeName("numeric"); +// $$->typmods = $2; +// $$->location = @1; +// } +// | NUMERIC opt_type_modifiers +// { +// $$ = SystemTypeName("numeric"); +// $$->typmods = $2; +// 
$$->location = @1; +// } +// | BOOLEAN_P +// { +// $$ = SystemTypeName("bool"); +// $$->location = @1; +// } +// ; +// +//opt_float: '(' Iconst ')' +// { +// /* +// * Check FLOAT() precision limits assuming IEEE floating +// * types - thomas 1997-09-18 +// */ +// if ($2 < 1) +// ereport(ERROR, +// (errcode(ERRCODE_INVALID_PARAMETER_VALUE), +// errmsg("precision for type float must be at least 1 bit"), +// parser_errposition(@2))); +// else if ($2 <= 24) +// $$ = SystemTypeName("float4"); +// else if ($2 <= 53) +// $$ = SystemTypeName("float8"); +// else +// ereport(ERROR, +// (errcode(ERRCODE_INVALID_PARAMETER_VALUE), +// errmsg("precision for type float must be less than 54 bits"), +// parser_errposition(@2))); +// } +// | /*EMPTY*/ { $$ = SystemTypeName("float8"); } +// ; +// + +%% + +static int paxc_scanner_errposition(int location) { + return location; +} + +static void paxc_yyerror(core_yyscan_t yyscanner, const char *message) { + ereport(ERROR, (errcode(ERRCODE_SYNTAX_ERROR), + errmsg("%s", _(message)))); +} +static int paxc_yylex(core_yyscan_t yyscanner) { + return core_yylex(&paxc_yylval.core_yystype, &paxc_yylloc, yyscanner); +} + +static core_yyscan_t paxc_scanner_init(const char *str, core_yy_extra_type *extra) { + paxc_result = NIL; + return scanner_init(str, extra, &ScanKeywords, ScanKeywordTokens); +} + +static void paxc_scanner_finish(core_yyscan_t yyscanner) { + scanner_finish(yyscanner); + paxc_result = NIL; +} + +List *paxc_raw_parse(const char *str) { + core_yyscan_t yyscanner; + core_yy_extra_type extra; + List *result; + int yyresult; + + yyscanner = paxc_scanner_init(str, &extra); + yyresult = paxc_yyparse(yyscanner); + if (yyresult != 0) + elog(ERROR, "pacx_yyparse returned %d", yyresult); + + result = paxc_result; + paxc_scanner_finish(yyscanner); + return result; +} + diff --git a/contrib/pax_storage/src/cpp/access/paxc_rel_options.cc b/contrib/pax_storage/src/cpp/access/paxc_rel_options.cc new file mode 100644 index 
00000000000..fc230b874d3 --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/paxc_rel_options.cc @@ -0,0 +1,270 @@ +#include "access/paxc_rel_options.h" + +namespace paxc { + +typedef struct { + const char *optname; /* option's name */ + const pax::ColumnEncoding_Kind kind; +} relopt_compress_type_mapping; + +static const relopt_compress_type_mapping kSelfRelCompressMap[] = { + {ColumnEncoding_Kind_NO_ENCODED_STR, + pax::ColumnEncoding_Kind::ColumnEncoding_Kind_NO_ENCODED}, + {ColumnEncoding_Kind_RLE_V2_STR, + pax::ColumnEncoding_Kind::ColumnEncoding_Kind_RLE_V2}, + {ColumnEncoding_Kind_DIRECT_DELTA_STR, + pax::ColumnEncoding_Kind::ColumnEncoding_Kind_DIRECT_DELTA}, + {ColumnEncoding_Kind_COMPRESS_ZSTD_STR, + pax::ColumnEncoding_Kind::ColumnEncoding_Kind_COMPRESS_ZSTD}, + {ColumnEncoding_Kind_COMPRESS_ZLIB_STR, + pax::ColumnEncoding_Kind::ColumnEncoding_Kind_COMPRESS_ZLIB}, +}; + +typedef struct { + const char *optname; /* option's name */ + const pax::PaxStorageFormat format; +} relopt_format_type_mapping; + +static const relopt_format_type_mapping kSelfRelFormatMap[] = { + {STORAGE_FORMAT_TYPE_ORC, pax::PaxStorageFormat::kTypeStorageOrcNonVec}, + {STORAGE_FORMAT_TYPE_ORC_VEC, pax::PaxStorageFormat::kTypeStorageOrcVec}, +}; + +// reloptions structure and variables. 
+static relopt_kind self_relopt_kind; + +#define PAX_COPY_STR_OPT(pax_opts_, pax_opt_name_) \ + do { \ + PaxOptions *pax_opts = reinterpret_cast(pax_opts_); \ + int pax_name_offset_ = *reinterpret_cast(pax_opts->pax_opt_name_); \ + if (pax_name_offset_) \ + strlcpy(pax_opts->pax_opt_name_, \ + reinterpret_cast(pax_opts) + pax_name_offset_, \ + sizeof(pax_opts->pax_opt_name_)); \ + } while (0) + +static const char *kSelfColumnEncodingClauseWhiteList[] = { + PAX_SOPT_COMPTYPE, + PAX_SOPT_COMPLEVEL, +}; + +static const relopt_parse_elt kSelfReloptTab[] = { + // no allow set with encoding + {PAX_SOPT_STORAGE_FORMAT, RELOPT_TYPE_STRING, + offsetof(PaxOptions, storage_format)}, + // allow with encoding + {PAX_SOPT_COMPTYPE, RELOPT_TYPE_STRING, + offsetof(PaxOptions, compress_type)}, + {PAX_SOPT_COMPLEVEL, RELOPT_TYPE_INT, offsetof(PaxOptions, compress_level)}, + {PAX_SOPT_PARTITION_BY, RELOPT_TYPE_STRING, + offsetof(PaxOptions, partition_by_offset)}, + {PAX_SOPT_PARTITION_RANGES, RELOPT_TYPE_STRING, + offsetof(PaxOptions, partition_ranges_offset)}, +}; + +static void paxc_validate_rel_options_storage_format(const char *value) { + size_t i; + + for (i = 0; i < lengthof(kSelfRelFormatMap); i++) { + if (strcmp(value, kSelfRelFormatMap[i].optname) == 0) return; + } + ereport(ERROR, (errmsg("unsupported storage format: '%s'", value))); +} + +static void paxc_validate_rel_options_compress_type(const char *value) { + size_t i; + + for (i = 0; i < lengthof(kSelfRelCompressMap); i++) { + if (strcmp(value, kSelfRelCompressMap[i].optname) == 0) return; + } + ereport(ERROR, (errmsg("unsupported compress type: '%s'", value))); +} + +static void paxc_validate_rel_option(PaxOptions *options) { + Assert(options); + if (strcmp(ColumnEncoding_Kind_NO_ENCODED_STR, options->compress_type) == 0 || + strcmp(ColumnEncoding_Kind_RLE_V2_STR, options->compress_type) == 0 || + strcmp(ColumnEncoding_Kind_DIRECT_DELTA_STR, options->compress_type) == + 0) { + if (options->compress_level != 0) { + 
ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE), + errmsg("compresslevel=%d should setting is not work for " + "current encoding.", + options->compress_level))); + } + } +} + +bytea *paxc_default_rel_options(Datum reloptions, char /*relkind*/, + bool validate) { + Assert(self_relopt_kind != 0); + bytea *rdopts = (bytea *)build_reloptions( + reloptions, validate, self_relopt_kind, sizeof(PaxOptions), + kSelfReloptTab, lengthof(kSelfReloptTab)); + + PAX_COPY_STR_OPT(rdopts, storage_format); + PAX_COPY_STR_OPT(rdopts, compress_type); + return rdopts; +} + +PaxOptions **paxc_relation_get_attribute_options(Relation rel) { + Datum *dats; + PaxOptions **opts; + int i; + + Assert(rel && OidIsValid(RelationGetRelid(rel))); + + opts = (PaxOptions **)palloc0(RelationGetNumberOfAttributes(rel) * + sizeof(PaxOptions *)); + + dats = get_rel_attoptions(RelationGetRelid(rel), + RelationGetNumberOfAttributes(rel)); + + for (i = 0; i < RelationGetNumberOfAttributes(rel); i++) { + if (DatumGetPointer(dats[i]) != NULL) { + opts[i] = (PaxOptions *)paxc_default_rel_options(dats[i], 0, false); + pfree(DatumGetPointer(dats[i])); + } + } + pfree(dats); + + return opts; +} + +static void paxc_validate_single_column_encoding_clauses( + List *single_column_encoding) { + ListCell *cell = NULL; + Datum d; + PaxOptions *option = NULL; + /* not allow caller pass the `PAX_SOPT_STORAGE_FORMAT` + */ + foreach (cell, single_column_encoding) { + DefElem *def = (DefElem *)lfirst(cell); + bool not_in_white_list = true; + + if (!def->defname) { + continue; + } + + for (size_t i = 0; i < lengthof(kSelfColumnEncodingClauseWhiteList); i++) { + if (strcmp(kSelfColumnEncodingClauseWhiteList[i], def->defname) == 0) { + not_in_white_list = false; + break; + } + } + + if (not_in_white_list) { + ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE), + errmsg("%s not allow setting in ENCODING CLAUSES.", + def->defname))); + } + } + + d = transformRelOptions(PointerGetDatum(NULL), 
single_column_encoding, NULL, + NULL, true, false); + + option = (PaxOptions *)paxc_default_rel_options(d, 0, true); + paxc_validate_rel_option(option); +} + +void paxc_validate_column_encoding_clauses(List *encoding_opts) { + ListCell *lc; + foreach (lc, encoding_opts) { + ColumnReferenceStorageDirective *crsd = + (ColumnReferenceStorageDirective *)lfirst(lc); + paxc_validate_single_column_encoding_clauses(crsd->encoding); + } +} + +List *paxc_transform_column_encoding_clauses(List *encoding_opts, bool validate, + bool fromType) { + List *ret_list = NIL; + + if (fromType) { + return NIL; + } + + ret_list = list_copy(encoding_opts); + /* there are no need to do column encoding clauses transform in pax + * because pax will setting default encoding inside + */ + if (validate) { + paxc_validate_single_column_encoding_clauses(encoding_opts); + } + + /* if column no setting the encoding clauses + * in transformColumnEncoding will pass the relation option + * to column encoding clauses, should remove the + * `PAX_SOPT_STORAGE_FORMAT` from it. 
+ */ + ListCell *cell = NULL; + foreach (cell, ret_list) { + DefElem *def = (DefElem *)lfirst(cell); + bool not_in_white_list = true; + if (!def->defname) { + continue; + } + + for (size_t i = 0; i < lengthof(kSelfColumnEncodingClauseWhiteList); i++) { + if (strcmp(kSelfColumnEncodingClauseWhiteList[i], def->defname) == 0) { + not_in_white_list = false; + break; + } + } + + if (not_in_white_list) { + ret_list = foreach_delete_current(ret_list, cell); + } + } + + return ret_list; +} + +void paxc_reg_rel_options() { + self_relopt_kind = add_reloption_kind(); + add_string_reloption( + self_relopt_kind, PAX_SOPT_STORAGE_FORMAT, "pax storage format", "orc", + paxc_validate_rel_options_storage_format, AccessExclusiveLock); + add_string_reloption(self_relopt_kind, PAX_SOPT_COMPTYPE, "pax compress type", + PAX_DEFAULT_COMPRESSTYPE, + paxc_validate_rel_options_compress_type, + AccessExclusiveLock); + add_int_reloption(self_relopt_kind, PAX_SOPT_COMPLEVEL, "pax compress level", + PAX_DEFAULT_COMPRESSLEVEL, PAX_MIN_COMPRESSLEVEL, + PAX_MAX_COMPRESSLEVEL, AccessExclusiveLock); + add_string_reloption(self_relopt_kind, PAX_SOPT_PARTITION_BY, "partition by", + NULL, NULL, AccessExclusiveLock); + add_string_reloption(self_relopt_kind, PAX_SOPT_PARTITION_RANGES, + "partition ranges", NULL, NULL, AccessExclusiveLock); +} + +} // namespace paxc + +namespace pax { + +ColumnEncoding_Kind CompressKeyToColumnEncodingKind(const char *encoding_str) { + Assert(encoding_str); + + for (size_t i = 0; i < lengthof(paxc::kSelfRelCompressMap); i++) { + if (strcmp(paxc::kSelfRelCompressMap[i].optname, encoding_str) == 0) { + return paxc::kSelfRelCompressMap[i].kind; + } + } + + CBDB_RAISE(cbdb::CException::kExTypeLogicError); +} + +PaxStorageFormat StorageFormatKeyToPaxStorageFormat( + const char *storage_format_str) { + Assert(storage_format_str); + + for (size_t i = 0; i < lengthof(paxc::kSelfRelFormatMap); i++) { + if (strcmp(paxc::kSelfRelFormatMap[i].optname, storage_format_str) == 0) { + 
return paxc::kSelfRelFormatMap[i].format; + } + } + + CBDB_RAISE(cbdb::CException::kExTypeLogicError); +} + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/access/paxc_rel_options.h b/contrib/pax_storage/src/cpp/access/paxc_rel_options.h new file mode 100644 index 00000000000..cc66575610b --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/paxc_rel_options.h @@ -0,0 +1,110 @@ +#pragma once + +#include "comm/cbdb_api.h" + +#include "exceptions/CException.h" +#include "storage/pax_defined.h" +#include "storage/proto/proto_wrappers.h" // for ColumnEncoding_Kind + +namespace paxc { + +#define ColumnEncoding_Kind_NO_ENCODED_STR "none" +#define ColumnEncoding_Kind_RLE_V2_STR "rle" +#define ColumnEncoding_Kind_DIRECT_DELTA_STR "delta" +#define ColumnEncoding_Kind_COMPRESS_ZSTD_STR "zstd" +#define ColumnEncoding_Kind_COMPRESS_ZLIB_STR "zlib" + +#define STORAGE_FORMAT_TYPE_ORC "orc" +#define STORAGE_FORMAT_TYPE_ORC_VEC "orc_vec" +#define STORAGE_FORMAT_TYPE_DEFAULT STORAGE_FORMAT_TYPE_ORC + +#define PAX_DEFAULT_COMPRESSLEVEL AO_DEFAULT_COMPRESSLEVEL +#define PAX_MIN_COMPRESSLEVEL AO_MIN_COMPRESSLEVEL +#define PAX_MAX_COMPRESSLEVEL AO_MAX_COMPRESSLEVEL +#define PAX_DEFAULT_COMPRESSTYPE ColumnEncoding_Kind_NO_ENCODED_STR + +#define PAX_SOPT_STORAGE_FORMAT "storage_format" +#define PAX_SOPT_COMPTYPE SOPT_COMPTYPE +#define PAX_SOPT_COMPLEVEL SOPT_COMPLEVEL +#define PAX_SOPT_PARTITION_BY "partition_by" +#define PAX_SOPT_PARTITION_RANGES "partition_ranges" + +// plain structure used by reloptions, can be accessed from C++ code. +struct PaxOptions { + // Pax needs to define the StdRdOptions instead of just vl_len. + // This is because many places in the CBDB assume that option in + // relation can be cast into StdRdOptions. + StdRdOptions rd_options; + char storage_format[16]; + char compress_type[16]; + int compress_level; + int partition_by_offset = 0; + int partition_ranges_offset = 0; + + char *partition_by() { + return partition_by_offset == 0 + ? 
NULL + : reinterpret_cast(this) + partition_by_offset; + } + char *partition_ranges() { + return partition_ranges_offset == 0 + ? NULL + : reinterpret_cast(this) + partition_ranges_offset; + } +}; + +#define RelationGetOptions(relation, field_name, default_opt) \ + ((relation)->rd_options \ + ? ((paxc::PaxOptions *)(relation)->rd_options)->field_name \ + : (default_opt)) + +/* + * used to register pax rel options + */ +void paxc_reg_rel_options(); + +/* + * parse the rel options in `pg_attribute_encoding` and relation + * if no ENCODING setting in `pg_attribute_encoding` will fill with + * the default one + */ +bytea *paxc_default_rel_options(Datum reloptions, char /*relkind*/, + bool validate); + +/* + * parse the attr options from `pg_attribute_encoding` + * if no ENCODING setting in `pg_attribute_encoding` will fill with + * the default one + */ +PaxOptions **paxc_relation_get_attribute_options(Relation rel); + +/* + * validate the ENCODING CLAUSES + * like `CREATE TABLE t1 (c1 int, COLUMN c1 ENCODING (key=value)) using + * pax` + */ +void paxc_validate_column_encoding_clauses(List *encoding_opts); + +/* + * transform the ENCODING options if key no setting + * validate will become true only when the encoding syntax is true + * like `CREATE TABLE t1 (c1 int ENCODING (key=value)) using pax` + * + * pax no need transform the ENCODING options if key no setting + * it will deal the default value inside pax colomn + */ +List *paxc_transform_column_encoding_clauses(List *encoding_opts, bool validate, + bool fromType); + +} // namespace paxc + +namespace pax { + +// use to transform compress type str to encoding kind +extern ColumnEncoding_Kind CompressKeyToColumnEncodingKind( + const char *encoding_str); + +extern PaxStorageFormat StorageFormatKeyToPaxStorageFormat( + const char *storage_format_str); + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/access/paxc_scanner.cc b/contrib/pax_storage/src/cpp/access/paxc_scanner.cc new file mode 100644 index 
00000000000..43d628ee25f --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/paxc_scanner.cc @@ -0,0 +1,131 @@ +#include "access/paxc_scanner.h" + +#include "access/pax_partition.h" + +#define blank_char(ch) ((ch) == ' ' || (ch) == '\t' || (ch) == '\n') +#define ident_char(ch) (((ch) >= 'a' && (ch) <= 'z') || \ + ((ch) >= 'A' && (ch) <= 'Z') || \ + ((ch) >= '0' && (ch) <= '9') || \ + (ch) == '_') + +static inline const char *paxc_eat_blank(const char *s) { + while (blank_char(*s)) + s++; + return s; +} + +static inline const char *paxc_expect_char(const char *s, char ch) { + const char *p = paxc_eat_blank(s); + if (*p != ch) + elog(ERROR, "invalid syntax for partition range:'%s' at '%s'", s, p); + + return p + 1; +} + +static const char *paxc_expect_ident(const char *s, const char *ident) { + const char *p = s; + const char *q; + size_t n; + + n = strlen(ident); + p = paxc_eat_blank(s); + if (strncasecmp(p, ident, n) != 0) + elog(ERROR, "unexpected ident: %s, want %s", s, ident); + q = p + n; + if (ident_char(*q)) + elog(ERROR, "unexpected ident: %s, want %s", s, ident); + + return q; +} + +static const char *paxc_parse_single_integer(const char *expr, Node **result) { + const char *p; + char *endptr; + int val; + + p = paxc_eat_blank(expr); + val = strtol(p, &endptr, 10); + A_Const *n = makeNode(A_Const); + + n->val.type = T_Integer; + n->val.val.ival = val; + n->location = -1; + *result = (Node *)n; + + return endptr; +} + +static const char *paxc_parse_expr_list(const char *expr_list, List **result) { + const char *p = expr_list; + + *result = NIL; + p = paxc_eat_blank(expr_list); + while (*p) { + Node *value = NULL; + p = paxc_parse_single_integer(p, &value); + Assert(value); + + *result = lappend(*result, value); + + p = paxc_eat_blank(p); + if (*p != ',') break; + p++; + } + return p; +} + +List *paxc_parse_partition_ranges(const char *ranges) { + const char *p = ranges; + List *result = NIL; + if (!p || *p == '\0') return NIL; + + while (*p && (p = 
paxc_expect_ident(p, "from"))) { + List *from_list = NIL; + List *to_list = NIL; + List *every_list = NIL; + + p = paxc_expect_char(p, '('); + p = paxc_parse_expr_list(p, &from_list); + p = paxc_expect_char(p, ')'); + Assert(from_list); + + p = paxc_expect_ident(p, "to"); + p = paxc_expect_char(p, '('); + p = paxc_parse_expr_list(p, &to_list); + p = paxc_expect_char(p, ')'); + Assert(to_list); + + p = paxc_eat_blank(p); + if (strncasecmp(p, "every", 5) == 0) { + // from(X) to(Y) every(Z) + p += 5; + p = paxc_expect_char(p, '('); + p = paxc_parse_expr_list(p, &every_list); + p = paxc_expect_char(p, ')'); + Assert(every_list); + p = paxc_eat_blank(p); + } + if (*p == ',') { + p++; + } else if (*p != '\0') { + elog(ERROR, "unexpected range delimiter: %s", p); + } + + if (list_length(from_list) == 0 || + list_length(from_list) != list_length(to_list)) { + elog(ERROR, "the lengths of expr_list are not equal in from and to: %d %d", + list_length(from_list), list_length(to_list)); + } + + PartitionRangeExtension *ext = (PartitionRangeExtension *)palloc0(sizeof(PartitionRangeExtension)); + PartitionBoundSpec *n = &ext->spec; + n->type = T_PartitionBoundSpec; + n->strategy = PARTITION_STRATEGY_RANGE; + n->is_default = false; + n->lowerdatums = from_list; + n->upperdatums = to_list; + ext->every = every_list; + result = lappend(result, ext); + } + return result; +} diff --git a/contrib/pax_storage/src/cpp/access/paxc_scanner.h b/contrib/pax_storage/src/cpp/access/paxc_scanner.h new file mode 100644 index 00000000000..79ca99f9537 --- /dev/null +++ b/contrib/pax_storage/src/cpp/access/paxc_scanner.h @@ -0,0 +1,13 @@ +#pragma once +#include "comm/cbdb_api.h" + +#ifdef __cplusplus +extern "C" { +#endif +struct List; +extern struct List *paxc_raw_parse(const char *str); +extern struct List *paxc_parse_partition_ranges(const char *ranges); + +#ifdef __cplusplus +} +#endif diff --git a/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.cc 
b/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.cc deleted file mode 100644 index 3e0bd53d103..00000000000 --- a/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.cc +++ /dev/null @@ -1,341 +0,0 @@ -#include "catalog/micro_partition_stats.h" - -#include "comm/cbdb_api.h" - -#include "comm/cbdb_wrappers.h" -#include "storage/micro_partition_metadata.h" -#include "storage/proto/proto_wrappers.h" - -namespace pax { -// SetStatsMessage may be called several times in a write, -// one for each micro partition, so all members need to reset. -// Some metainfo like typid, collation, oids for less/greater, -// fmgr should be exactly consistent. -MicroPartitionStats *MicroPartitionStats::SetStatsMessage( - pax::stats::MicroPartitionStatisticsInfo *stats, int natts) { - FmgrInfo finfo; - std::tuple zero_oids = {InvalidOid, InvalidOid, InvalidOid, InvalidOid}; - - Assert(natts > 0); - Assert(stats && stats->columnstats_size() == 0); - initial_check_ = false; - stats_ = stats; - - memset(&finfo, 0, sizeof(finfo)); - procs_.clear(); - finfos_.clear(); - status_.clear(); - for (int i = 0; i < natts; i++) { - procs_.emplace_back(zero_oids); - finfos_.emplace_back(std::pair({finfo, finfo})); - status_.emplace_back('u'); - auto columnstats = stats_->add_columnstats(); - Assert(columnstats->allnull()); - Assert(!columnstats->hasnull()); - } - Assert(stats_->columnstats_size() == natts); - return this; -} - -void MicroPartitionStats::AddRow(TupleTableSlot *slot) { - auto desc = slot->tts_tupleDescriptor; - auto n = desc->natts; - - if (!initial_check_) { - DoInitialCheck(desc); - initial_check_ = true; - } - CBDB_CHECK(status_.size() == static_cast(n), - cbdb::CException::ExType::kExTypeSchemaNotMatch); - for (auto i = 0; i < n; i++) { - auto att = &desc->attrs[i]; - - AssertImply(att->attisdropped, slot->tts_isnull[i]); - if (slot->tts_isnull[i]) - AddNullColumn(i); - else - AddNonNullColumn(i, slot->tts_values[i], desc); - } -} - -void 
MicroPartitionStats::AddNullColumn(int column_index) { - Assert(column_index >= 0); - Assert(column_index < static_cast(procs_.size())); - - auto column_stats = stats_->mutable_columnstats(column_index); - column_stats->set_hasnull(true); -} - -void MicroPartitionStats::AddNonNullColumn(int column_index, Datum value, - TupleDesc desc) { - Assert(column_index >= 0); - Assert(column_index < static_cast(procs_.size())); - - auto att = TupleDescAttr(desc, column_index); - auto collation = att->attcollation; - auto typlen = att->attlen; - auto typbyval = att->attbyval; - auto column_stats = stats_->mutable_columnstats(column_index); - column_stats->set_allnull(false); - - // update min/max - switch (status_[column_index]) { - case 'x': - break; - case 'y': - Assert(column_stats->minmaxstats().has_typid()); - Assert(column_stats->minmaxstats().has_minimal()); - Assert(column_stats->minmaxstats().has_maximum()); - Assert(column_stats->minmaxstats().has_proclt()); - Assert(column_stats->minmaxstats().has_procgt()); - Assert(column_stats->minmaxstats().has_procle()); - Assert(column_stats->minmaxstats().has_procge()); - Assert(column_stats->minmaxstats().typid() == att->atttypid); - Assert(column_stats->minmaxstats().collation() == collation); - - UpdateMinMaxValue(column_index, value, collation, typlen, typbyval); - break; - case 'n': { - auto minmax = column_stats->mutable_minmaxstats(); - - Assert(!minmax->has_proclt()); - Assert(!minmax->has_procgt()); - Assert(!minmax->has_procle()); - Assert(!minmax->has_procge()); - Assert(!minmax->has_typid()); - Assert(!minmax->has_minimal()); - Assert(!minmax->has_maximum()); - - minmax->set_typid(att->atttypid); - minmax->set_collation(collation); - minmax->set_proclt(std::get<0>(procs_[column_index])); - minmax->set_procgt(std::get<1>(procs_[column_index])); - minmax->set_procle(std::get<2>(procs_[column_index])); - minmax->set_procge(std::get<3>(procs_[column_index])); - minmax->set_minimal(ToValue(value, typlen, typbyval)); - 
minmax->set_maximum(ToValue(value, typlen, typbyval)); - status_[column_index] = 'y'; - break; - } - default: - Assert(false); - } -} - -void MicroPartitionStats::UpdateMinMaxValue(int column_index, Datum datum, - Oid collation, int typlen, - bool typbyval) { - Assert(initial_check_); - Assert(column_index >= 0 && static_cast(column_index) < status_.size()); - Assert(status_[column_index] == 'y'); - - auto &finfos = finfos_[column_index]; - auto minmax = - stats_->mutable_columnstats(column_index)->mutable_minmaxstats(); - bool ok; - - { - const auto &min = minmax->minimal(); - auto val = FromValue(min, typlen, typbyval, &ok); - CBDB_CHECK(ok, cbdb::CException::kExTypeLogicError); - auto update = - DatumGetBool(cbdb::FunctionCall2Coll(&finfos.first, collation, datum, val)); - if (update) minmax->set_minimal(ToValue(datum, typlen, typbyval)); - } - { - const auto &max = minmax->maximum(); - auto val = FromValue(max, typlen, typbyval, &ok); - CBDB_CHECK(ok, cbdb::CException::kExTypeLogicError); - auto update = - DatumGetBool(cbdb::FunctionCall2Coll(&finfos.second, collation, datum, val)); - if (update) minmax->set_maximum(ToValue(datum, typlen, typbyval)); - } -} - -bool MicroPartitionStats::GetStrategyProcinfo( - Oid typid, std::tuple &procids, - std::pair &finfos) { - return cbdb::MinMaxGetStrategyProcinfo(typid, &std::get<0>(procids), &finfos.first, - BTLessStrategyNumber) && - cbdb::MinMaxGetStrategyProcinfo(typid, &std::get<1>(procids), &finfos.second, - BTGreaterStrategyNumber) && - cbdb::MinMaxGetStrategyProcinfo(typid, &std::get<2>(procids), nullptr, - BTLessEqualStrategyNumber) && - cbdb::MinMaxGetStrategyProcinfo(typid, &std::get<3>(procids), nullptr, - BTGreaterEqualStrategyNumber); -} - -void MicroPartitionStats::DoInitialCheck(TupleDesc desc) { - auto natts = desc->natts; - - Assert(natts == static_cast(status_.size())); - Assert(natts == stats_->columnstats_size()); - Assert(status_.size() == procs_.size()); - Assert(status_.size() == finfos_.size()); - 
- for (int i = 0; i < natts; i++) { - auto att = TupleDescAttr(desc, i); - if (att->attisdropped || - !GetStrategyProcinfo(att->atttypid, procs_[i], finfos_[i])) { - status_[i] = 'x'; - continue; - } - status_[i] = 'n'; - } -} - -Datum MicroPartitionStats::FromValue(const std::string &s, int typlen, - bool typbyval, bool *ok) { - const char *p = s.data(); - *ok = true; - if (typbyval) { - Assert(typlen > 0); - switch (typlen) { - case 1: { - int8 i = *reinterpret_cast(p); - return cbdb::Int8ToDatum(i); - } - case 2: { - int16 i = *reinterpret_cast(p); - return cbdb::Int16ToDatum(i); - } - case 4: { - int32 i = *reinterpret_cast(p); - return cbdb::Int32ToDatum(i); - } - case 8: { - int64 i = *reinterpret_cast(p); - return cbdb::Int64ToDatum(i); - } - default: - Assert(!"unexpected typbyval, len not in 1,2,4,8"); - *ok = false; - break; - } - return 0; - } - - Assert(typlen == -1 || typlen > 0); - return PointerGetDatum(p); -} - -std::string MicroPartitionStats::ToValue(Datum datum, int typlen, - bool typbyval) { - if (typbyval) { - Assert(typlen > 0); - switch (typlen) { - case 1: { - int8 i = cbdb::DatumToInt8(datum); - return std::string(reinterpret_cast(&i), sizeof(i)); - } - case 2: { - int16 i = cbdb::DatumToInt16(datum); - return std::string(reinterpret_cast(&i), sizeof(i)); - } - case 4: { - int32 i = cbdb::DatumToInt32(datum); - return std::string(reinterpret_cast(&i), sizeof(i)); - } - case 8: { - int64 i = cbdb::DatumToInt64(datum); - return std::string(reinterpret_cast(&i), sizeof(i)); - } - default: - Assert(!"unexpected typbyval, len not in 1,2,4,8"); - break; - } - CBDB_RAISE(cbdb::CException::kExTypeLogicError); - } - - if (typlen == -1) { - void *v; - int len; - - v = cbdb::PointerAndLenFromDatum(datum, &len); - Assert(v && len != -1); - return std::string(reinterpret_cast(v), len); - } - // byref but fixed size - Assert(typlen > 0); - return std::string(reinterpret_cast(cbdb::DatumToPointer(datum)), - typlen); -} -} // namespace pax - -static inline 
const char *BoolToString(bool b) { return b ? "true" : "false"; } - -static char *TypeValueToCString(Oid typid, Oid collation, - const std::string &value) { - FmgrInfo finfo; - HeapTuple tuple; - Form_pg_type form; - Datum datum; - bool ok; - - tuple = SearchSysCache1(TYPEOID, ObjectIdGetDatum(typid)); - if (!HeapTupleIsValid(tuple)) - elog(ERROR, "cache lookup failed for type %u", typid); - - form = (Form_pg_type)GETSTRUCT(tuple); - Assert(OidIsValid(form->typoutput)); - - datum = pax::MicroPartitionStats::FromValue(value, form->typlen, - form->typbyval, &ok); - if (!ok) - elog(ERROR, "unexpected typlen: %d\n", form->typlen); - - fmgr_info_cxt(form->typoutput, &finfo, CurrentMemoryContext); - datum = FunctionCall1Coll(&finfo, collation, datum); - ReleaseSysCache(tuple); - - return DatumGetCString(datum); -} - -// define stat type for custom output -extern "C" { -extern Datum MicroPartitionStatsInput(PG_FUNCTION_ARGS); -extern Datum MicroPartitionStatsOutput(PG_FUNCTION_ARGS); -PG_FUNCTION_INFO_V1(MicroPartitionStatsInput); -PG_FUNCTION_INFO_V1(MicroPartitionStatsOutput); -} - -Datum MicroPartitionStatsInput(PG_FUNCTION_ARGS) { - ereport(ERROR, (errmsg("unsupport MicroPartitionStatsInput"))); - (void)fcinfo; - PG_RETURN_POINTER(NULL); -} - -Datum MicroPartitionStatsOutput(PG_FUNCTION_ARGS) { - struct varlena *v = PG_GETARG_VARLENA_PP(0); - pax::stats::MicroPartitionStatisticsInfo stats; - StringInfoData str; - - bool ok = stats.ParseFromArray(VARDATA_ANY(v), VARSIZE_ANY_EXHDR(v)); - if (!ok) ereport(ERROR, (errmsg("micropartition stats is corrupt"))); - - initStringInfo(&str); - for (int i = 0, n = stats.columnstats_size(); i < n; i++) { - const auto &column = stats.columnstats(i); - - if (i > 0) appendStringInfoChar(&str, ','); - - appendStringInfo(&str, "[(%s,%s)", BoolToString(column.allnull()), - BoolToString(column.hasnull())); - - if (!column.has_minmaxstats()) { - appendStringInfoString(&str, ",None]"); - continue; - } - - const auto &minmax = 
column.minmaxstats(); - appendStringInfo(&str, ",(%u,%u,%u,%u,%s,%s)]", minmax.typid(), - minmax.collation(), minmax.proclt(), - minmax.procgt(), - TypeValueToCString(minmax.typid(), minmax.collation(), - minmax.minimal()), - TypeValueToCString(minmax.typid(), minmax.collation(), - minmax.maximum())); - } - - PG_RETURN_CSTRING(str.data); -} diff --git a/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.h b/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.h deleted file mode 100644 index 56be8e8cddf..00000000000 --- a/contrib/pax_storage/src/cpp/catalog/micro_partition_stats.h +++ /dev/null @@ -1,51 +0,0 @@ -#pragma once -#include "comm/cbdb_api.h" - -#include -#include -#include - -namespace pax { -namespace stats { -class MicroPartitionStatisticsInfo; -} - -class MicroPartitionStats final { - public: - MicroPartitionStats() = default; - MicroPartitionStats *SetStatsMessage( - pax::stats::MicroPartitionStatisticsInfo *stats, int natts); - - void AddRow(TupleTableSlot *slot); - - static std::string ToValue(Datum datum, int typlen, bool typbyval); - static Datum FromValue(const std::string &s, int typlen, bool typbyval, bool *ok); - - private: - void AddNullColumn(int column_index); - void AddNonNullColumn(int column_index, Datum value, TupleDesc desc); - void DoInitialCheck(TupleDesc desc); - void UpdateMinMaxValue(int column_index, Datum datum, Oid collation, - int typlen, bool typbyval); - static bool GetStrategyProcinfo(Oid typid, std::tuple &procids, - std::pair &finfos); - - // stats_: only references the info object by pointer - pax::stats::MicroPartitionStatisticsInfo *stats_ = nullptr; - - // less: tuple[0], greater: tuple[1], le: tuple[2], ge: tuple[3] - std::vector> procs_; - // less: pair[0], greater: pair[1] - std::vector> finfos_; - - // status to indicate whether the oids are initialized - // or the min-max values are initialized - // 'u': all is uninitialized - // 'x': column doesn't support min-max - // 'n': oids are initialized, but 
min-max value is missing - // 'y': min-max is set, needs update. - std::vector status_; - bool initial_check_ = false; -}; - -} // namespace pax diff --git a/contrib/pax_storage/src/cpp/catalog/pax_aux_table.cc b/contrib/pax_storage/src/cpp/catalog/pax_aux_table.cc index 906d8d9fd22..44d97f25694 100644 --- a/contrib/pax_storage/src/cpp/catalog/pax_aux_table.cc +++ b/contrib/pax_storage/src/cpp/catalog/pax_aux_table.cc @@ -3,14 +3,14 @@ #include "comm/cbdb_api.h" #include - #include +#include "catalog/pax_fastsequence.h" +#include "catalog/pg_pax_tables.h" #include "comm/cbdb_wrappers.h" #include "storage/file_system.h" #include "storage/local_file_system.h" #include "storage/micro_partition_metadata.h" -#include "storage/paxc_block_map_manager.h" namespace paxc { @@ -46,26 +46,20 @@ static void CPaxTransactionalTruncateTable(Oid aux_relid) { // 2.create table outside transactional block, insert data // and truncate table inside transactional block. static void CPaxNontransactionalTruncateTable(Relation rel) { - HeapTuple tuple; Relation aux_rel; Oid aux_relid; - tuple = SearchSysCache1(PAXTABLESID, RelationGetRelid(rel)); - if (!HeapTupleIsValid(tuple)) - ereport(ERROR, (errcode(ERRCODE_UNDEFINED_SCHEMA), - errmsg("cache lookup failed with relid=%u for aux relation " - "in pg_pax_tables.", - RelationGetRelid(rel)))); - aux_relid = ((Form_pg_pax_tables)GETSTRUCT(tuple))->blocksrelid; - ReleaseSysCache(tuple); + aux_relid = ::paxc::GetPaxAuxRelid(RelationGetRelid(rel)); Assert(OidIsValid(aux_relid)); aux_rel = relation_open(aux_relid, AccessExclusiveLock); heap_truncate_one_rel(aux_rel); relation_close(aux_rel, NoLock); + + paxc::CPaxInitializeFastSequenceEntry(RelationGetRelid(rel), FASTSEQUENCE_INIT_TYPE_INPLACE); } -static void CPaxCreateMicroPartitionTable(const Relation rel) { +void CPaxCreateMicroPartitionTable(Relation rel) { Relation pg_class_desc; char aux_relname[32]; Oid relid; @@ -79,7 +73,7 @@ static void CPaxCreateMicroPartitionTable(const Relation rel) 
{ // 1. create blocks table. snprintf(aux_relname, sizeof(aux_relname), "pg_pax_blocks_%u", pax_relid); - aux_namespace_id = PG_PAXAUX_NAMESPACE; + aux_namespace_id = PG_EXTAUX_NAMESPACE; aux_relid = GetNewOidForRelation(pg_class_desc, ClassOidIndexId, Anum_pg_class_oid, // new line aux_relname, aux_namespace_id); @@ -91,12 +85,18 @@ static void CPaxCreateMicroPartitionTable(const Relation rel) { // TODO(chenhongjie): uncompressed and compressed ptblocksize are needed. TupleDescInitEntry(tupdesc, (AttrNumber)ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKSIZE, "ptblocksize", INT4OID, -1, 0); - TupleDescInitEntry(tupdesc, (AttrNumber)ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS, + TupleDescInitEntry(tupdesc, + (AttrNumber)ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS, "ptstatistics", PAX_AUX_STATS_TYPE_OID, -1, 0); + { + // Add constraints for the aux table + auto attr = TupleDescAttr(tupdesc, ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1); + attr->attnotnull = true; + } relid = heap_create_with_catalog( aux_relname, aux_namespace_id, InvalidOid, aux_relid, InvalidOid, InvalidOid, rel->rd_rel->relowner, HEAP_TABLE_AM_OID, tupdesc, NIL, - RELKIND_RELATION, rel->rd_rel->relpersistence, rel->rd_rel->relisshared, + RELKIND_RELATION, RELPERSISTENCE_PERMANENT, rel->rd_rel->relisshared, RelationIsMapped(rel), ONCOMMIT_NOOP, NULL, /* GP Policy */ (Datum)0, false, /* use _user_acl */ true, true, InvalidOid, NULL, /* typeaddress */ @@ -104,8 +104,10 @@ static void CPaxCreateMicroPartitionTable(const Relation rel) { Assert(relid == aux_relid); table_close(pg_class_desc, NoLock); + NewRelationCreateToastTable(relid, (Datum)0); + // 2. insert entry into pg_pax_tables. - InsertPaxTablesEntry(pax_relid, aux_relid, "", 0); + ::paxc::InsertPaxTablesEntry(pax_relid, aux_relid, NULL); // 3. record pg_depend, pg_pax_blocks_ depends relation. 
{ @@ -123,84 +125,115 @@ static void CPaxCreateMicroPartitionTable(const Relation rel) { base.classId = RelationRelationId; base.objectId = pax_relid; base.objectSubId = 0; - aux.classId = PaxTablesRelationId; + aux.classId = PAX_TABLES_RELATION_ID; aux.objectId = pax_relid; aux.objectSubId = 0; recordDependencyOn(&aux, &base, DEPENDENCY_INTERNAL); } -} - -static void CPaxDeletePaxBlockEntry(Oid relid, Snapshot pax_meta_data_snapshot, - const char *blockname) { - Relation rel; - ScanKeyData key[1]; - SysScanDesc scan; - HeapTuple tuple; - NameData ptblockname; + CommandCounterIncrement(); - rel = table_open(relid, RowExclusiveLock); - namestrcpy(&ptblockname, blockname); - ScanKeyInit(&key[0], ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME, - BTEqualStrategyNumber, F_NAMEEQ, NameGetDatum(&ptblockname)); - - // should add snapshot support - scan = systable_beginscan(rel, InvalidOid, false, pax_meta_data_snapshot, 1, - key); - - tuple = systable_getnext(scan); - if (HeapTupleIsValid(tuple)) { - CatalogTupleDelete(rel, &tuple->t_self); + // 4. create index on ptblockname dynamically, the index name should be pg_paxaux.pg_pax_blocks_index_xxx. 
+ { + char aux_index_name[NAMEDATALEN]; + IndexInfo *indexInfo; + List *indexColNames; + Relation aux_rel; + int16 coloptions[1]; + Oid classObjectId[1]; + Oid collationObjectId[1]; + + snprintf(aux_index_name, sizeof(aux_index_name), "%s_idx", aux_relname); + + indexInfo = makeNode(IndexInfo); + indexInfo->ii_NumIndexAttrs = 1; + indexInfo->ii_NumIndexKeyAttrs = 1; + indexInfo->ii_IndexAttrNumbers[0] = ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME; + indexInfo->ii_Expressions = NIL; + indexInfo->ii_ExpressionsState = NIL; + indexInfo->ii_Predicate = NIL; + indexInfo->ii_PredicateState = NULL; + indexInfo->ii_Unique = true; + indexInfo->ii_ReadyForInserts = true; + indexInfo->ii_Concurrent = false; + indexInfo->ii_Am = BTREE_AM_OID; + indexInfo->ii_Context = CurrentMemoryContext; + + collationObjectId[0] = C_COLLATION_OID; + classObjectId[0] = GetDefaultOpClass(NAMEOID, BTREE_AM_OID); + coloptions[0] = 0; + + auto attr = TupleDescAttr(tupdesc, ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1); + indexColNames = list_make1(NameStr(attr->attname)); + + // ShareLock is not really needed here, but take it anyway. 
+ aux_rel = table_open(aux_relid, ShareLock); + + index_create(aux_rel, + aux_index_name, + InvalidOid, + InvalidOid, + InvalidOid, + InvalidOid, + indexInfo, + indexColNames, + BTREE_AM_OID, + rel->rd_rel->reltablespace, + collationObjectId, classObjectId, coloptions, (Datum) 0, + INDEX_CREATE_IS_PRIMARY, 0, true, true, NULL); + + // Unlock target table -- no one can see it + table_close(aux_rel, ShareLock); + + // Unlock the index -- no one can see it anyway + //UnlockRelationOid(paxauxiliary_idxid, AccessExclusiveLock); + + CommandCounterIncrement(); } - systable_endscan(scan); - table_close(rel, RowExclusiveLock); } -static void CPaxCopyPaxBlockEntry(Relation old_relation, Relation new_relation) { +void DeleteMicroPartitionEntry(Oid pax_relid, Snapshot snapshot, + const char *blockname) { + ScanAuxContext context; HeapTuple tuple; - SysScanDesc pax_scan; - Relation old_aux_rel, new_aux_rel; - Oid old_aux_relid = 0, new_aux_relid = 0; + Oid aux_relid; - HeapTuple tupcache; - tupcache = SearchSysCache1(PAXTABLESID, RelationGetRelid(old_relation)); - Assert(HeapTupleIsValid(tupcache)); - old_aux_relid = ((Form_pg_pax_tables)GETSTRUCT(tupcache))->blocksrelid; - ReleaseSysCache(tupcache); + aux_relid = ::paxc::GetPaxAuxRelid(pax_relid); - tupcache = SearchSysCache1(PAXTABLESID, RelationGetRelid(new_relation)); - Assert(HeapTupleIsValid(tupcache)); - new_aux_relid = ((Form_pg_pax_tables)GETSTRUCT(tupcache))->blocksrelid; - ReleaseSysCache(tupcache); + context.BeginSearchMicroPartition(aux_relid, InvalidOid, snapshot, RowExclusiveLock, blockname); + tuple = context.SearchMicroPartitionEntry(); + if (!HeapTupleIsValid(tuple)) + elog(ERROR, "delete micro partition \"%s\" failed for relation(%u)", blockname, pax_relid); - old_aux_rel = table_open(old_aux_relid, RowExclusiveLock); - new_aux_rel = table_open(new_aux_relid, RowExclusiveLock); + Assert(context.GetRelation()); + CatalogTupleDelete(context.GetRelation(), &tuple->t_self); - pax_scan = 
systable_beginscan(old_aux_rel, InvalidOid, false, - NULL, 0, NULL); - while ((tuple = systable_getnext(pax_scan)) != NULL) { - CatalogTupleInsert(new_aux_rel, tuple); - } - systable_endscan(pax_scan); - table_close(old_aux_rel, RowExclusiveLock); - table_close(new_aux_rel, RowExclusiveLock); + context.EndSearchMicroPartition(NoLock); } -} // namespace paxc +void InsertMicroPartitionPlaceHolder(Oid aux_relid, const char *blockname) { + NameData ptblockname; + Datum values[NATTS_PG_PAX_BLOCK_TABLES]; + bool nulls[NATTS_PG_PAX_BLOCK_TABLES]; -namespace cbdb { -Oid GetPaxAuxRelid(Oid relid) { - Oid aux_relid = InvalidOid; - CBDB_WRAP_START; - { - GetPaxTablesEntryAttributes(relid, &aux_relid, NULL, NULL); - return aux_relid; - } - CBDB_WRAP_END; + Assert(blockname && strlen(blockname) < NAMEDATALEN); + namestrcpy(&ptblockname, blockname); + + values[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1] = NameGetDatum(&ptblockname); + nulls[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1] = false; + + nulls[ANUM_PG_PAX_BLOCK_TABLES_PTTUPCOUNT - 1] = true; + nulls[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKSIZE - 1] = true; + nulls[ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS - 1] = true; + + InsertTuple(aux_relid, values, nulls); + CommandCounterIncrement(); } -static void InsertPaxBlockEntry(Oid relid, const char *blockname, int pttupcount, - int ptblocksize, const ::pax::stats::MicroPartitionStatisticsInfo &mp_stats) { +void InsertOrUpdateMicroPartitionPlaceHolder(Oid aux_relid, + const char *blockname, + int num_tuples, int file_size, + const ::pax::stats::MicroPartitionStatisticsInfo &mp_stats) { int stats_length = mp_stats.ByteSize(); uint32 len = VARHDRSZ + stats_length; void *output; @@ -209,58 +242,221 @@ static void InsertPaxBlockEntry(Oid relid, const char *blockname, int pttupcount Datum values[NATTS_PG_PAX_BLOCK_TABLES]; bool nulls[NATTS_PG_PAX_BLOCK_TABLES]; - output = cbdb::Palloc(len); + output = palloc(len); SET_VARSIZE(output, len); mp_stats.SerializeToArray(VARDATA(output), 
stats_length); Assert(blockname); namestrcpy(&ptblockname, blockname); - values[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1] = - NameGetDatum(&ptblockname); + values[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1] = NameGetDatum(&ptblockname); nulls[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME - 1] = false; - values[ANUM_PG_PAX_BLOCK_TABLES_PTTUPCOUNT - 1] = Int32GetDatum(pttupcount); + values[ANUM_PG_PAX_BLOCK_TABLES_PTTUPCOUNT - 1] = Int32GetDatum(num_tuples); nulls[ANUM_PG_PAX_BLOCK_TABLES_PTTUPCOUNT - 1] = false; - values[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKSIZE - 1] = - Int32GetDatum(ptblocksize); + values[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKSIZE - 1] = Int32GetDatum(file_size); nulls[ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKSIZE - 1] = false; - // Serialize catalog statitics information into PG bytea format and saved in aux table ptstatitics column. + // Serialize catalog statitics information into PG bytea format and saved in + // aux table ptstatitics column. values[ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS - 1] = PointerGetDatum(output); nulls[ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS - 1] = false; - CBDB_WRAP_START; - { - paxc::InsertTuple(relid, values, nulls); + ScanAuxContext context; + context.BeginSearchMicroPartition(aux_relid, InvalidOid, NULL, RowExclusiveLock, blockname); + auto aux_rel = context.GetRelation(); + auto oldtuple = context.SearchMicroPartitionEntry(); + if (!HeapTupleIsValid(oldtuple)) + elog(ERROR, "micro partition doesn't exist before inserting tuples"); + + if (num_tuples > 0) { + auto newtuple = heap_form_tuple(RelationGetDescr(aux_rel), values, nulls); + + newtuple->t_data->t_ctid = oldtuple->t_data->t_ctid; + newtuple->t_self = oldtuple->t_self; + newtuple->t_tableOid = oldtuple->t_tableOid; + CatalogTupleUpdate(aux_rel, &newtuple->t_self, newtuple); + heap_freetuple(newtuple); + } else { + CatalogTupleDelete(aux_rel, &oldtuple->t_self); + } + context.EndSearchMicroPartition(NoLock); + + pfree(output); + + CommandCounterIncrement(); +} + +Oid FindAuxIndexOid(Oid 
aux_relid, Snapshot snapshot) { + ScanKeyData scankey[1]; + Relation indrel; + SysScanDesc scan; + HeapTuple tuple; + Oid index_oid; + int index_count = 0; + + ScanKeyInit(&scankey[0], Anum_pg_index_indrelid, BTEqualStrategyNumber, F_OIDEQ, ObjectIdGetDatum(aux_relid)); + indrel = table_open(IndexRelationId, AccessShareLock); + scan = systable_beginscan(indrel, IndexIndrelidIndexId, true, snapshot, 1, scankey); + + index_oid = InvalidOid; + while (HeapTupleIsValid(tuple = systable_getnext(scan))) { + auto index = (Form_pg_index) GETSTRUCT(tuple); + index_count++; + if (!index->indislive || !index->indisvalid) continue; + index_oid = index->indexrelid; + } + systable_endscan(scan); + table_close(indrel, NoLock); + + if (index_count != 1 || !OidIsValid(index_oid)) + elog(ERROR, "unexpected number of index of aux table: %d", index_count); + + return index_oid; +} + +static inline Oid GetAuxIndexOid(Oid aux_relid, Oid *aux_index_relid, Snapshot snapshot) { + if (aux_index_relid) { + if (OidIsValid(*aux_index_relid)) + return *aux_index_relid; + else + return *aux_index_relid = FindAuxIndexOid(aux_relid, snapshot); + } else { + return FindAuxIndexOid(aux_relid, snapshot); + } +} + +void ScanAuxContext::BeginSearchMicroPartition(Oid aux_relid, Oid aux_index_relid, Snapshot snapshot, LOCKMODE lockmode, const char *blockname) { + Assert(aux_relid); + if (!OidIsValid(aux_index_relid) && blockname) + aux_index_relid = FindAuxIndexOid(aux_relid, snapshot); + + aux_rel_ = table_open(aux_relid, lockmode); + if (blockname) { + ScanKeyData scankey[1]; + + ScanKeyInit(&scankey[0], ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME, BTEqualStrategyNumber, F_NAMEEQ, CStringGetDatum(blockname)); + scan_ = systable_beginscan(aux_rel_, aux_index_relid, true, snapshot, 1, scankey); + } else { + scan_ = systable_beginscan(aux_rel_, aux_index_relid, false, snapshot, 0, nullptr); + } +} + +HeapTuple ScanAuxContext::SearchMicroPartitionEntry() { + Assert(aux_rel_ && scan_); + return 
systable_getnext(scan_); +} + +void ScanAuxContext::EndSearchMicroPartition(LOCKMODE lockmode) { + Assert(aux_rel_ && scan_); + + systable_endscan(scan_); + table_close(aux_rel_, lockmode); + scan_ = nullptr; + aux_rel_ = nullptr; +} + +void PaxAuxRelationSetNewFilenode(Oid aux_relid) { + Relation aux_rel; + Oid toastrelid; + ReindexParams reindex_params = {0}; + + aux_rel = relation_open(aux_relid, AccessExclusiveLock); + RelationSetNewRelfilenode(aux_rel, aux_rel->rd_rel->relpersistence); + toastrelid = aux_rel->rd_rel->reltoastrelid; + if (OidIsValid(toastrelid)) { + Relation toast_rel; + toast_rel = relation_open(toastrelid, AccessExclusiveLock); + RelationSetNewRelfilenode(toast_rel, toast_rel->rd_rel->relpersistence); + relation_close(toast_rel, NoLock); } + if (aux_rel->rd_rel->relhasindex) + reindex_relation(aux_relid, REINDEX_REL_PROCESS_TOAST, &reindex_params); + pgstat_count_truncate(aux_rel); + relation_close(aux_rel, NoLock); +} + +bool IsMicroPartitionVisible(Relation pax_rel, BlockNumber block, Snapshot snapshot) { + struct ScanAuxContext context; + HeapTuple tuple; + Oid aux_relid; + char block_name[NAMEDATALEN]; + bool ok; + + aux_relid = ::paxc::GetPaxAuxRelid(RelationGetRelid(pax_rel)); + snprintf(block_name, sizeof(block_name), "%u", block); + + context.BeginSearchMicroPartition(aux_relid, InvalidOid, snapshot, AccessShareLock, block_name); + tuple = context.SearchMicroPartitionEntry(); + ok = HeapTupleIsValid(tuple); + context.EndSearchMicroPartition(NoLock); + + return ok; +} + +static void CPaxCopyPaxBlockEntry(Relation old_relation, + Relation new_relation) { + HeapTuple tuple; + SysScanDesc pax_scan; + Relation old_aux_rel, new_aux_rel; + Oid old_aux_relid = 0, new_aux_relid = 0; + + old_aux_relid = ::paxc::GetPaxAuxRelid(RelationGetRelid(old_relation)); + new_aux_relid = ::paxc::GetPaxAuxRelid(RelationGetRelid(new_relation)); + old_aux_rel = table_open(old_aux_relid, RowExclusiveLock); + new_aux_rel = table_open(new_aux_relid, 
RowExclusiveLock); + + pax_scan = systable_beginscan(old_aux_rel, InvalidOid, false, NULL, 0, NULL); + while ((tuple = systable_getnext(pax_scan)) != NULL) { + CatalogTupleInsert(new_aux_rel, tuple); + } + systable_endscan(pax_scan); + table_close(old_aux_rel, RowExclusiveLock); + table_close(new_aux_rel, RowExclusiveLock); +} + +} // namespace paxc + +namespace cbdb { +Oid GetPaxAuxRelid(Oid relid) { + CBDB_WRAP_START; + { return ::paxc::GetPaxAuxRelid(relid); } CBDB_WRAP_END; +} - cbdb::Pfree(output); +void DeleteMicroPartitionEntry(Oid pax_relid, Snapshot snapshot, + const std::string &blockname) { + CBDB_WRAP_START; + { paxc::DeleteMicroPartitionEntry(pax_relid, snapshot, blockname.c_str()); } + CBDB_WRAP_END; } -static void DeletePaxBlockEntry(Oid relid, Snapshot snapshot, - const char *blockname) { +void InsertMicroPartitionPlaceHolder(Oid pax_relid, const std::string &blockname) { CBDB_WRAP_START; { - paxc::CPaxDeletePaxBlockEntry(relid, snapshot, blockname); + Oid aux_relid; + + aux_relid = ::paxc::GetPaxAuxRelid(pax_relid); + paxc::InsertMicroPartitionPlaceHolder(aux_relid, blockname.c_str()); } CBDB_WRAP_END; } +void InsertOrUpdateMicroPartitionEntry(const pax::WriteSummary &summary) { + CBDB_WRAP_START; + { + Oid aux_relid; -void DeleteMicroPartitionEntry(Oid pax_relid, - Snapshot snapshot, - const std::string &block_id) { - Oid aux_relid = GetPaxAuxRelid(pax_relid); - cbdb::DeletePaxBlockEntry(aux_relid, snapshot, - block_id.c_str()); + aux_relid = ::paxc::GetPaxAuxRelid(summary.rel_oid); + paxc::InsertOrUpdateMicroPartitionPlaceHolder(aux_relid, summary.block_id.c_str(), + summary.num_tuples, summary.file_size, summary.mp_stats); + } + CBDB_WRAP_END; } -void AddMicroPartitionEntry(const pax::WriteSummary &summary) { - Oid aux_relid; - aux_relid = GetPaxAuxRelid(summary.rel_oid); - cbdb::InsertPaxBlockEntry(aux_relid, summary.block_id.c_str(), - summary.num_tuples, summary.file_size, summary.mp_stats); +bool IsMicroPartitionVisible(Relation pax_rel, 
BlockNumber block, Snapshot snapshot) { + CBDB_WRAP_START; + { return paxc::IsMicroPartitionVisible(pax_rel, block, snapshot); } + CBDB_WRAP_END; } static void PaxTransactionalTruncateTable(Oid aux_relid) { @@ -289,31 +485,6 @@ static void PaxCopyPaxBlockEntry(Relation old_relation, Relation new_relation) { } // namespace cbdb namespace pax { -void CCPaxAuxTable::PaxAuxRelationSetNewFilenode(Relation rel, - const RelFileNode *newrnode, - char persistence) { - HeapTuple tupcache; - std::string path; - FileSystem *fs = pax::Singleton::GetInstance(); - - tupcache = cbdb::SearchSysCache(rel, PAXTABLESID); - if (cbdb::TupleIsValid(tupcache)) { - Oid aux_relid = ((Form_pg_pax_tables)GETSTRUCT(tupcache))->blocksrelid; - cbdb::PaxTransactionalTruncateTable(aux_relid); - cbdb::ReleaseTupleCache(tupcache); - } else { - // create pg_pax_blocks_ - cbdb::PaxCreateMicroPartitionTable(rel); - } - - // Create pax table relfilenode file and database directory under path base/, - // The relfilenode created here is to be compatible with PG normal process - // logic instead of being used by pax storage. - cbdb::RelationCreateStorageDirectory(*newrnode, persistence, SMGR_MD, rel); - path = cbdb::BuildPaxDirectoryPath(*newrnode, rel->rd_backend); - Assert(!path.empty()); - CBDB_CHECK((fs->CreateDirectory(path) == 0), cbdb::CException::ExType::kExTypeIOError); -} void CCPaxAuxTable::PaxAuxRelationNontransactionalTruncate(Relation rel) { cbdb::PaxNontransactionalTruncateTable(rel); @@ -337,43 +508,52 @@ void CCPaxAuxTable::PaxAuxRelationCopyData(Relation rel, src_path = cbdb::BuildPaxDirectoryPath(rel->rd_node, rel->rd_backend); Assert(!src_path.empty()); - // get micropatition file source folder filename list for copying. 
- filelist = fs->ListDirectory(src_path); - if (filelist.empty()) return; - dst_path = cbdb::BuildPaxDirectoryPath(*newrnode, rel->rd_backend); Assert(!dst_path.empty()); if (src_path.empty() || dst_path.empty()) CBDB_RAISE(cbdb::CException::ExType::kExTypeFileOperationError); - // createnewpath is used to indicate if creating destination micropartition file directory and storage file for copying or not. - // 1. For RelationCopyData case, createnewpath should be set as true to explicitly create a new destination directory under + // createnewpath is used to indicate if creating destination micropartition + // file directory and storage file for copying or not. + // 1. For RelationCopyData case, createnewpath should be set as true to + // explicitly create a new destination directory under // new tablespace path pg_tblspc/. - // 2. For RelationCopyDataForCluster case, createnewpath should be set as false cause the destination directory was already - // created with a new temp table by previously calling PaxAuxRelationSetNewFilenode. + // 2. For RelationCopyDataForCluster case, createnewpath should be set as + // false cause the destination directory was already + // created with a new temp table by previously calling + // PaxAuxRelationSetNewFilenode. if (createnewpath) { // create pg_pax_table relfilenode file and dbid directory. cbdb::RelationCreateStorageDirectory(*newrnode, rel->rd_rel->relpersistence, - SMGR_MD, rel); + SMGR_MD, rel); // create micropartition file destination folder for copying. - CBDB_CHECK((fs->CreateDirectory(dst_path) == 0), cbdb::CException::ExType::kExTypeIOError); + CBDB_CHECK((fs->CreateDirectory(dst_path) == 0), + cbdb::CException::ExType::kExTypeIOError); } + // Get micropatition file source folder filename list for copying, if file + // list is empty then skip copying file directly. 
+ filelist = fs->ListDirectory(src_path); + if (filelist.empty()) return; + for (auto &iter : filelist) { Assert(!iter.empty()); - src_path.append("/"); - src_path.append(iter); - dst_path.append("/"); - dst_path.append(iter); - fs->CopyFile(src_path, dst_path); + std::string src_file = src_path; + std::string dst_file = dst_path; + src_file.append("/"); + src_file.append(iter); + dst_file.append("/"); + dst_file.append(iter); + fs->CopyFile(src_file, dst_file); } // TODO(Tony) : here need to implement pending delete srcPath after set new // tablespace. } -void CCPaxAuxTable::PaxAuxRelationCopyDataForCluster(Relation old_rel, Relation new_rel) { +void CCPaxAuxTable::PaxAuxRelationCopyDataForCluster(Relation old_rel, + Relation new_rel) { PaxAuxRelationCopyData(old_rel, &new_rel->rd_node, false); cbdb::PaxCopyPaxBlockEntry(old_rel, new_rel); // TODO(Tony) : here need to implement PAX re-organize semantics logic. @@ -388,5 +568,5 @@ void CCPaxAuxTable::PaxAuxRelationFileUnlink(RelFileNode node, relpath = cbdb::BuildPaxDirectoryPath(node, backend); fs->DeleteDirectory(relpath, delete_topleveldir); } -} // namespace pax +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/catalog/pax_aux_table.h b/contrib/pax_storage/src/cpp/catalog/pax_aux_table.h index 7d79f36f863..3d39ef67e4d 100644 --- a/contrib/pax_storage/src/cpp/catalog/pax_aux_table.h +++ b/contrib/pax_storage/src/cpp/catalog/pax_aux_table.h @@ -1,10 +1,9 @@ #pragma once -#include "catalog/pax_aux_table.h" - #include "comm/cbdb_api.h" #include +#include "catalog/pax_aux_table.h" #include "storage/micro_partition_metadata.h" #define ANUM_PG_PAX_BLOCK_TABLES_PTBLOCKNAME 1 @@ -13,6 +12,37 @@ #define ANUM_PG_PAX_BLOCK_TABLES_PTSTATISITICS 4 #define NATTS_PG_PAX_BLOCK_TABLES 4 +namespace paxc { +void CPaxCreateMicroPartitionTable(Relation rel); + +Oid FindAuxIndexOid(Oid aux_relid, Snapshot snapshot); + +void InsertMicroPartitionPlaceHolder(Oid aux_relid, const char *blockname); +void 
DeleteMicroPartitionEntry(Oid pax_relid, Snapshot snapshot, const char *blockname); +// Scan aux table +// seqscan: MicroPartitionInfoIterator +// index scan +struct ScanAuxContext { + public: + void BeginSearchMicroPartition(Oid aux_relid, Oid aux_index_relid, + Snapshot snapshot, LOCKMODE lockmode, const char *blockname); + void BeginSearchMicroPartition(Oid aux_relid, Snapshot snapshot, LOCKMODE lockmode) { + BeginSearchMicroPartition(aux_relid, InvalidOid, snapshot, lockmode, nullptr); + } + HeapTuple SearchMicroPartitionEntry(); + void EndSearchMicroPartition(LOCKMODE lockmode); + + Relation GetRelation() { return aux_rel_; } + + private: + Relation aux_rel_ = nullptr; + SysScanDesc scan_ = nullptr; +}; + +void PaxAuxRelationSetNewFilenode(Oid aux_relid); +bool IsMicroPartitionVisible(Relation pax_rel, BlockNumber block, Snapshot snapshot); +} + namespace pax { class CCPaxAuxTable final { public: @@ -25,26 +55,27 @@ class CCPaxAuxTable final { static void PaxAuxRelationNontransactionalTruncate(Relation rel); - static void PaxAuxRelationCopyData(Relation rel, - const RelFileNode *newrnode, + static void PaxAuxRelationCopyData(Relation rel, const RelFileNode *newrnode, bool createnewpath = true); - static void PaxAuxRelationCopyDataForCluster(Relation old_rel, Relation new_rel); + static void PaxAuxRelationCopyDataForCluster(Relation old_rel, + Relation new_rel); static void PaxAuxRelationFileUnlink(RelFileNode node, BackendId backend, bool delete_topleveldir); }; + } // namespace pax namespace cbdb { Oid GetPaxAuxRelid(Oid relid); -void AddMicroPartitionEntry(const pax::WriteSummary &summary); +void InsertMicroPartitionPlaceHolder(Oid pax_relid, const std::string &blockname); +void InsertOrUpdateMicroPartitionEntry(const pax::WriteSummary &summary); -void DeleteMicroPartitionEntry(Oid pax_relid, - Snapshot snapshot, - const std::string &block_id); +void DeleteMicroPartitionEntry(Oid pax_relid, Snapshot snapshot, + const std::string &blockname); +bool 
IsMicroPartitionVisible(Relation pax_rel, BlockNumber block, Snapshot snapshot); } // namespace cbdb - diff --git a/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.cc b/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.cc new file mode 100644 index 00000000000..a78cdf9c235 --- /dev/null +++ b/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.cc @@ -0,0 +1,175 @@ +#include "catalog/pax_fastsequence.h" + +#include "comm/cbdb_api.h" + +namespace paxc { + +// Get the required objid Tuple from pg_pax_fastsequence system table. +// objid indicates single pax micro-partition table oid. +// lock_mode indicates the lock level used when retrive data from system table. +static HeapTuple CPaxOpenFastSequenceTable(Oid objid, + Relation *pax_fastsequence_rel, + SysScanDesc *pax_fastsequece_scan, + LOCKMODE lock_mode) { + ScanKeyData scankey[1]; + HeapTuple tuple; + Relation rel; + SysScanDesc scan; + + rel = table_open(PAX_FASTSEQUENCE_OID, lock_mode); + + /* SELECT * FROM paxaux.pg_pax_fastsequence WHERE objid = :1 FOR UPDATE */ + ScanKeyInit(&scankey[0], ANUM_PG_PAX_FAST_SEQUENCE_OBJID, + BTEqualStrategyNumber, F_OIDEQ, ObjectIdGetDatum(objid)); + + scan = systable_beginscan(rel, PAX_FASTSEQUENCE_INDEX_OID, true, NULL, 1, + scankey); + + tuple = systable_getnext(scan); + + *pax_fastsequence_rel = rel; + *pax_fastsequece_scan = scan; + + return tuple; +} + +static inline void CPaxCloseFastSequenceTable(Relation pax_fastsequence_rel, + SysScanDesc pax_fastsequece_scan, + LOCKMODE lock_mode) { + systable_endscan(pax_fastsequece_scan); + table_close(pax_fastsequence_rel, lock_mode); +} + +// update the existing fast sequence number for (objid). +// This tuple is updated with the new value. Otherwise, a new tuple is inserted +// into the table. 
+static void CPaxUpdateFastsequence(Relation pax_fastsequence_rel, + HeapTuple old_tuple, TupleDesc tuple_desc, + Oid objid, int32 new_seqno) { + HeapTuple new_tuple; + Datum values[NATTS_PG_PAX_FAST_SEQUENCE_TABLES]; + bool nulls[NATTS_PG_PAX_FAST_SEQUENCE_TABLES]; + + // If such a tuple does not exist, insert a new one. + Assert(HeapTupleIsValid(old_tuple)); + + values[ANUM_PG_PAX_FAST_SEQUENCE_OBJID - 1] = ObjectIdGetDatum(objid); + values[ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE - 1] = + Int32GetDatum(new_seqno); + nulls[ANUM_PG_PAX_FAST_SEQUENCE_OBJID - 1] = false; + nulls[ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE - 1] = false; + + new_tuple = heap_form_tuple(tuple_desc, values, nulls); + Assert(HeapTupleIsValid(new_tuple)); + + new_tuple->t_data->t_ctid = old_tuple->t_data->t_ctid; + new_tuple->t_self = old_tuple->t_self; + + heap_inplace_update(pax_fastsequence_rel, new_tuple); + heap_freetuple(new_tuple); +} + +// InitializeFastSequenceEntry is used to generate and keep track of allocated +// micropartition file number. objid indicates single pax micro-partition table +// oid. lastsequence indicates the current allocated file number by using +// fastsequence allocation. +void CPaxInitializeFastSequenceEntry(Oid objid, char init_type) { + Relation pax_fastsequence_rel; + SysScanDesc scan; + TupleDesc desc; + HeapTuple tuple; + HeapTuple new_tuple; + Datum values[NATTS_PG_PAX_FAST_SEQUENCE_TABLES]; + bool nulls[NATTS_PG_PAX_FAST_SEQUENCE_TABLES]; + + Assert(init_type == FASTSEQUENCE_INIT_TYPE_CREATE || + init_type == FASTSEQUENCE_INIT_TYPE_INPLACE || + init_type == FASTSEQUENCE_INIT_TYPE_UPDATE); + // Initilize a new object id and use row-based exclusive lock to avoid + // concurrency issue. 
+ tuple = CPaxOpenFastSequenceTable(objid, &pax_fastsequence_rel, &scan, + RowExclusiveLock); + + desc = RelationGetDescr(pax_fastsequence_rel); + values[ANUM_PG_PAX_FAST_SEQUENCE_OBJID - 1] = ObjectIdGetDatum(objid); + values[ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE - 1] = Int32GetDatum(0); + nulls[ANUM_PG_PAX_FAST_SEQUENCE_OBJID - 1] = false; + nulls[ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE - 1] = false; + new_tuple = heap_form_tuple(desc, values, nulls); + + if (init_type == FASTSEQUENCE_INIT_TYPE_CREATE) { + ObjectAddress base; + ObjectAddress aux; + + if (HeapTupleIsValid(tuple)) + elog(ERROR, "existing tuple in pg_pax_fastsequence when creating pax table"); + + CatalogTupleInsert(pax_fastsequence_rel, new_tuple); + + base.classId = RelationRelationId; + base.objectId = objid; + base.objectSubId = 0; + aux.classId = PAX_FASTSEQUENCE_OID; + aux.objectId = objid; + aux.objectSubId = 0; + recordDependencyOn(&aux, &base, DEPENDENCY_INTERNAL); + } else { + // exists, set to 0 in-place, or update + if (!HeapTupleIsValid(tuple)) + elog(ERROR, "no tuple found in pg_pax_fastsequence for existing pax table"); + + new_tuple->t_data->t_ctid = tuple->t_data->t_ctid; + new_tuple->t_self = tuple->t_self; + if (init_type == FASTSEQUENCE_INIT_TYPE_INPLACE) + heap_inplace_update(pax_fastsequence_rel, new_tuple); + else if (init_type == FASTSEQUENCE_INIT_TYPE_UPDATE) + CatalogTupleUpdate(pax_fastsequence_rel, &new_tuple->t_self, new_tuple); + } + + heap_freetuple(new_tuple); + CPaxCloseFastSequenceTable(pax_fastsequence_rel, scan, RowExclusiveLock); +} + +// GetFastSequences +// Get consecutive sequence numbers, the returned sequence number is the +// lastsequence + 1 +int32 CPaxGetFastSequences(Oid objid) { + Relation pax_fastsequence_rel = NULL; + SysScanDesc scan = NULL; + TupleDesc tuple_desc; + HeapTuple tuple; + Datum seqno_datum; + int32 seqno; + bool isnull = false; + + // Increase and read sequence number base on objid and use row-based exclusive + // lock to avoid 
concurrency issue. + tuple = CPaxOpenFastSequenceTable(objid, &pax_fastsequence_rel, &scan, + RowExclusiveLock); + + Assert(HeapTupleIsValid(tuple)); + + tuple_desc = RelationGetDescr(pax_fastsequence_rel); + + seqno_datum = heap_getattr(tuple, ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE, + tuple_desc, &isnull); + if (isnull) { + ereport( + ERROR, + (errcode(ERRCODE_UNDEFINED_OBJECT), + errmsg( + "CPaxGetFastSequences got an invalid lastsequence number: NULL"))); + } + seqno = DatumGetInt32(seqno_datum); + if (seqno < 0) + elog(ERROR, "sequence number out of range: %d", seqno); + + CPaxUpdateFastsequence(pax_fastsequence_rel, tuple, tuple_desc, objid, + seqno + 1); + + CPaxCloseFastSequenceTable(pax_fastsequence_rel, scan, RowExclusiveLock); + + return seqno; +} + +} // namespace paxc diff --git a/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.h b/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.h new file mode 100644 index 00000000000..b5269dfa3df --- /dev/null +++ b/contrib/pax_storage/src/cpp/catalog/pax_fastsequence.h @@ -0,0 +1,32 @@ +//------------------------------------------------------------------------- +// Cloudberry Database +// Copyright (c) 2023, HashData Technology Limited. +// pax_fastsequence.h +// provide a system table maintaining a light-weight fast sequence number for a +// unique object. 
+// +// IDENTIFICATION +// src/catalog/pax_fastsequence.h +// Author: Tony Ying +//-------------------------------------------------------------------------- + +#pragma once +#include "comm/cbdb_api.h" + +#define ANUM_PG_PAX_FAST_SEQUENCE_OBJID 1 +#define ANUM_PG_PAX_FAST_SEQUENCE_LASTSEQUENCE 2 +#define NATTS_PG_PAX_FAST_SEQUENCE_TABLES 2 + +// CREATE: initialize seqno by INSERT, no tuple exists before +// INPLACE: inplace update when grow the seqno or non-transactional truncate +// UPDATE: transactional truncate, needs to preserve the old seqno +// after rollback +#define FASTSEQUENCE_INIT_TYPE_CREATE 'C' +#define FASTSEQUENCE_INIT_TYPE_INPLACE 'I' +#define FASTSEQUENCE_INIT_TYPE_UPDATE 'U' + +namespace paxc { +void CPaxInitializeFastSequenceEntry(Oid objid, char init_type); +int32 CPaxGetFastSequences(Oid objid); + +} // namespace paxc diff --git a/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.cc b/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.cc new file mode 100644 index 00000000000..c3d7b98f5c9 --- /dev/null +++ b/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.cc @@ -0,0 +1,131 @@ +#include "catalog/pg_pax_tables.h" + +#include "comm/cbdb_api.h" + +namespace paxc { + +void InsertPaxTablesEntry(Oid relid, Oid blocksrelid, Node *partitionspec) { + Relation rel; + TupleDesc desc; + HeapTuple tuple; + bool nulls[NATTS_PG_PAX_TABLES]; + Datum values[NATTS_PG_PAX_TABLES]; + + rel = table_open(PAX_TABLES_RELATION_ID, RowExclusiveLock); + desc = RelationGetDescr(rel); + Assert(desc->natts == NATTS_PG_PAX_TABLES); + + values[ANUM_PG_PAX_TABLES_RELID - 1] = ObjectIdGetDatum(relid); + values[ANUM_PG_PAX_TABLES_AUXRELID - 1] = ObjectIdGetDatum(blocksrelid); + nulls[ANUM_PG_PAX_TABLES_RELID - 1] = false; + nulls[ANUM_PG_PAX_TABLES_AUXRELID - 1] = false; + + if (partitionspec) { + values[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = + CStringGetTextDatum(nodeToString(partitionspec)); + nulls[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = false; + } else { + 
values[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = 0; + nulls[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = true; + } + tuple = heap_form_tuple(desc, values, nulls); + + /* insert a new tuple */ + CatalogTupleInsert(rel, tuple); + + table_close(rel, NoLock); +} + +void GetPaxTablesEntryAttributes(Oid relid, Oid *blocksrelid, + Node **partitionspec) { + Relation rel; + ScanKeyData key[1]; + SysScanDesc scan; + HeapTuple tuple; + bool isnull; + + rel = table_open(PAX_TABLES_RELATION_ID, RowExclusiveLock); + + ScanKeyInit(&key[0], ANUM_PG_PAX_TABLES_RELID, BTEqualStrategyNumber, F_OIDEQ, + ObjectIdGetDatum(relid)); + + scan = systable_beginscan(rel, PAX_TABLES_RELID_INDEX_ID, true, NULL, 1, key); + tuple = systable_getnext(scan); + if (!HeapTupleIsValid(tuple)) + ereport(ERROR, (errcode(ERRCODE_UNDEFINED_OBJECT), + errmsg("pax table relid \"%d\" does not exist in " + "pg_pax_tables", + relid))); + + if (partitionspec) { + Datum v; + v = heap_getattr(tuple, ANUM_PG_PAX_TABLES_PARTITIONSPEC, + RelationGetDescr(rel), &isnull); + *partitionspec = NULL; + if (!isnull) { + char *str = TextDatumGetCString(v); + *partitionspec = (Node *)stringToNode(str); + pfree(str); + } + } + + if (blocksrelid) { + *blocksrelid = heap_getattr(tuple, ANUM_PG_PAX_TABLES_AUXRELID, + RelationGetDescr(rel), &isnull); + if (isnull) ereport(ERROR, (errmsg("pg_pax_tables.auxrelid is null"))); + } + + /* Finish up scan and close pg_pax_tables catalog. 
*/ + systable_endscan(scan); + table_close(rel, NoLock); +} + +void PaxInitializePartitionSpec(Relation paxrel, Node *part) { + Relation rel; + ScanKeyData key[1]; + SysScanDesc scan; + HeapTuple oldtuple; + TupleDesc desc; + bool isnull; + + Assert(paxrel->rd_rel->relkind == RELKIND_RELATION || + paxrel->rd_rel->relkind == RELKIND_MATVIEW); + Assert(paxrel->rd_options); + + rel = table_open(PAX_TABLES_RELATION_ID, RowExclusiveLock); + desc = RelationGetDescr(rel); + ScanKeyInit(&key[0], ANUM_PG_PAX_TABLES_RELID, BTEqualStrategyNumber, F_OIDEQ, + ObjectIdGetDatum(RelationGetRelid(paxrel))); + + scan = systable_beginscan(rel, PAX_TABLES_RELID_INDEX_ID, true, NULL, 1, key); + oldtuple = systable_getnext(scan); + if (!HeapTupleIsValid(oldtuple)) elog(ERROR, "only support pax tables"); + + (void)heap_getattr(oldtuple, ANUM_PG_PAX_TABLES_PARTITIONSPEC, desc, &isnull); + if (isnull) { + HeapTuple newtup; + Datum values[NATTS_PG_PAX_TABLES]; + bool repl[NATTS_PG_PAX_TABLES]; + bool isnull[NATTS_PG_PAX_TABLES]; + + memset(repl, false, sizeof(repl)); + values[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = + CStringGetTextDatum(nodeToString(part)); + repl[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = true; + isnull[ANUM_PG_PAX_TABLES_PARTITIONSPEC - 1] = false; + + newtup = heap_modify_tuple(oldtuple, desc, values, isnull, repl); + CatalogTupleUpdate(rel, &oldtuple->t_self, newtup); + heap_freetuple(newtup); + + CommandCounterIncrement(); + } else { + elog(ERROR, "existing pax table update partition spec?"); + } + + /* Finish up scan and close pg_pax_tables catalog. 
*/ + systable_endscan(scan); + table_close(rel, NoLock); +} + +} // namespace paxc diff --git a/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.h b/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.h new file mode 100644 index 00000000000..f4d138b0a4b --- /dev/null +++ b/contrib/pax_storage/src/cpp/catalog/pg_pax_tables.h @@ -0,0 +1,24 @@ +#pragma once +#include "comm/cbdb_api.h" + +#define NATTS_PG_PAX_TABLES 3 +#define ANUM_PG_PAX_TABLES_RELID 1 +#define ANUM_PG_PAX_TABLES_AUXRELID 2 +#define ANUM_PG_PAX_TABLES_PARTITIONSPEC 3 + +namespace paxc { + +void InsertPaxTablesEntry(Oid relid, Oid blocksrelid, Node *partitionspec); + +void GetPaxTablesEntryAttributes(Oid relid, Oid *blocksrelid, + Node **partitionspec); + +void PaxInitializePartitionSpec(Relation paxrel, Node *part); + +static inline Oid GetPaxAuxRelid(Oid pax_relid) { + Oid aux_relid; + GetPaxTablesEntryAttributes(pax_relid, &aux_relid, nullptr); + return aux_relid; +} + +} // namespace paxc diff --git a/contrib/pax_storage/src/cpp/cmake/pax.cmake b/contrib/pax_storage/src/cpp/cmake/pax.cmake new file mode 100644 index 00000000000..6c7ef92b60c --- /dev/null +++ b/contrib/pax_storage/src/cpp/cmake/pax.cmake @@ -0,0 +1,187 @@ + +## generate_sql +add_executable(generate_sql_script_program "${CMAKE_CURRENT_SOURCE_DIR}/../../tools/gen_sql.c") +target_include_directories(generate_sql_script_program PUBLIC ${CMAKE_CURRENT_SOURCE_DIR} ${CBDB_INCLUDE_DIR}) +add_custom_command(OUTPUT generate_sql_file + COMMAND ${CMAKE_CURRENT_BINARY_DIR}/generate_sql_script_program > "${CMAKE_CURRENT_SOURCE_DIR}/../../pax-cdbinit--1.0.sql" + DEPENDS generate_sql_script_program + COMMENT "dynamically generate sql script file" +) +add_custom_target(create_sql_script DEPENDS generate_sql_script_program generate_sql_file) + +# bison +bison_target(paxc_gram access/paxc_gram.y ${CMAKE_CURRENT_BINARY_DIR}/paxc_gram.c) + + +set(pax_comm_src + comm/bitmap.cc + comm/guc.cc + comm/paxc_wrappers.cc + comm/pax_memory.cc + 
comm/cbdb_wrappers.cc) + +set(pax_exceptions_src + exceptions/CException.cc) + +set(pax_storage_src + storage/cache/pax_cache.cc + storage/cache/pax_plasma_cache.cc + storage/columns/pax_column_cache.cc + storage/columns/pax_column_traits.cc + storage/columns/pax_column.cc + storage/columns/pax_compress.cc + storage/columns/pax_columns.cc + storage/columns/pax_encoding_utils.cc + storage/columns/pax_encoding_non_fixed_column.cc + storage/columns/pax_encoding_column.cc + storage/columns/pax_decoding.cc + storage/columns/pax_encoding.cc + storage/columns/pax_rlev2_decoding.cc + storage/columns/pax_rlev2_encoding.cc + storage/columns/pax_vec_column.cc + storage/columns/pax_vec_encoding_column.cc + storage/oper/pax_oper.cc + storage/oper/pax_stats.cc + storage/file_system.cc + storage/local_file_system.cc + storage/micro_partition.cc + storage/micro_partition_file_factory.cc + storage/micro_partition_metadata.cc + storage/micro_partition_row_filter_reader.cc + storage/micro_partition_stats.cc + storage/orc/orc_format_reader.cc + storage/orc/orc_group.cc + storage/orc/orc_vec_group.cc + storage/orc/orc_reader.cc + storage/orc/orc_writer.cc + storage/pax_buffer.cc + storage/pax_filter.cc + storage/pax_itemptr.cc + storage/proto/protobuf_stream.cc + storage/pax.cc + storage/pax_table_partition_writer.cc + storage/strategy.cc + storage/micro_partition_iterator.cc + ) + + +set(pax_access_src + ${BISON_paxc_gram_OUTPUTS} # BISON output file + access/paxc_rel_options.cc + access/paxc_scanner.cc + access/pax_access_handle.cc + access/pax_deleter.cc + access/pax_dml_state.cc + access/pax_inserter.cc + access/pax_partition.cc + access/pax_updater.cc + access/pax_scanner.cc) + +set(pax_catalog_src + catalog/pax_aux_table.cc + catalog/pg_pax_tables.cc + catalog/pax_fastsequence.cc + ) + +set(pax_vec_src + storage/vec/pax_vec_adapter.cc + storage/vec/pax_vec_reader.cc) + + +#### pax.so +set(pax_target_src ${PROTO_SRCS} ${pax_storage_src} ${pax_exceptions_src} + ${pax_access_src} 
${pax_comm_src} ${pax_catalog_src} ${pax_vec_src}) +set(pax_target_include ${ZTSD_HEADER} ${CMAKE_CURRENT_SOURCE_DIR} ${CBDB_INCLUDE_DIR}) +set(pax_target_link_libs protobuf zstd z postgres) +set(pax_target_link_directories ${PROJECT_SOURCE_DIR}/../../src/backend/) +set(pax_target_dependencies generate_protobuf create_sql_script) + +# enable plasma +if (ENABLE_PLASMA) + set(pax_target_link_libs ${pax_target_link_libs} uuid plasma) +endif() + +add_library(pax SHARED ${pax_target_src}) +set_target_properties(pax PROPERTIES OUTPUT_NAME pax) + +# vec build +if (VEC_BUILD) + find_package(PkgConfig REQUIRED) + pkg_check_modules(GLIB REQUIRED glib-2.0) + set(pax_target_include + ${pax_target_include} + ${VEC_HOME}/src/include # for utils/tuptable_vec.h + ${VEC_HOME}/arrow/include # for arrow-glib/arrow-glib.h and otehr arrow interface + ${GLIB_INCLUDE_DIRS} # for glib-object.h + ) + set(pax_target_link_directories + ${pax_target_link_directories} + ${VEC_HOME}/arrow/lib) + set(pax_target_link_libs + ${pax_target_link_libs} + arrow) +endif(VEC_BUILD) + +target_include_directories(pax PUBLIC ${pax_target_include}) +target_link_directories(pax PUBLIC ${pax_target_link_directories}) +target_link_libraries(pax PUBLIC ${pax_target_link_libs}) +set_target_properties(pax PROPERTIES + BUILD_RPATH_USE_ORIGIN ON + BUILD_WITH_INSTALL_RPATH ON + INSTALL_RPATH "$ORIGIN:$ORIGIN/.." 
+ LINK_FLAGS "-Wl,--enable-new-dtags" +) + +add_dependencies(pax ${pax_target_dependencies}) +add_custom_command(TARGET pax POST_BUILD + COMMAND ${CMAKE_COMMAND} -E + copy_if_different $ ${CMAKE_CURRENT_SOURCE_DIR}/../../pax.so) + +if (BUILD_GTEST) + add_subdirectory(contrib/googletest) + ADD_DEFINITIONS(-DRUN_GTEST) + file(GLOB test_case_sources + pax_gtest_helper.cc + pax_gtest.cc + ${CMAKE_CURRENT_SOURCE_DIR}/*/*_test.cc + ${CMAKE_CURRENT_SOURCE_DIR}/*/*/*_test.cc) + + add_executable(test_main ${pax_target_src} ${test_case_sources}) + add_dependencies(test_main ${pax_target_dependencies} gtest gmock) + target_include_directories(test_main PUBLIC ${pax_target_include} ${CMAKE_CURRENT_SOURCE_DIR} ${gtest_SOURCE_DIR}/include contrib/cpp-stub/src/ contrib/cpp-stub/src_linux/) + + target_link_directories(test_main PUBLIC ${pax_target_link_directories}) + target_link_libraries(test_main PUBLIC ${pax_target_link_libs} gtest gmock postgres) +endif(BUILD_GTEST) + +if(BUILD_GBENCH) + add_subdirectory(contrib/googlebench) + ADD_DEFINITIONS(-DRUN_GBENCH) + file(GLOB bench_sources + pax_gbench.cc + ${CMAKE_CURRENT_SOURCE_DIR}/*/*_bench.cc + ${CMAKE_CURRENT_SOURCE_DIR}/*/*/*_bench.cc) + + add_executable(bench_main ${pax_target_src} ${bench_sources}) + add_dependencies(bench_main ${pax_target_dependencies} gtest gmock) + target_include_directories(bench_main PUBLIC ${pax_target_include} ${CMAKE_CURRENT_SOURCE_DIR} contrib/googlebench/include contrib/cpp-stub/src/ contrib/cpp-stub/src_linux/) + link_directories(contrib/googlebench/src) + target_link_libraries(bench_main PUBLIC ${pax_target_link_libs} gtest gmock benchmark postgres) + if (VEC_BUILD) + target_link_libraries(bench_main PRIVATE arrow) + endif(VEC_BUILD) +endif(BUILD_GBENCH) + +if (BUILD_TOOLS) + add_subdirectory(contrib/tabulate) + link_directories($ENV{GPHOME}/lib) + + add_executable(pax_dump storage/tools/pax_dump.cpp storage/tools/pax_dump_reader.cpp) + target_include_directories(pax_dump PUBLIC 
${pax_target_include} ${CMAKE_CURRENT_SOURCE_DIR} contrib/tabulate/include) + add_dependencies(pax_dump ${pax_target_dependencies}) + target_link_libraries(pax_dump PUBLIC pax protobuf) +endif(BUILD_TOOLS) + +## install dynamic libraray +install(TARGETS pax + LIBRARY DESTINATION ${CMAKE_INSTALL_PREFIX}/lib) \ No newline at end of file diff --git a/contrib/pax_storage/src/cpp/cmake/pax_format.cmake b/contrib/pax_storage/src/cpp/cmake/pax_format.cmake new file mode 100644 index 00000000000..55206384e91 --- /dev/null +++ b/contrib/pax_storage/src/cpp/cmake/pax_format.cmake @@ -0,0 +1,93 @@ +# paxformat.so + +set(pax_comm_src + comm/bitmap.cc + comm/guc.cc + comm/paxc_wrappers.cc + comm/pax_memory.cc + comm/cbdb_wrappers.cc) + +set(pax_exceptions_src + exceptions/CException.cc) + +set(pax_storage_src + storage/cache/pax_cache.cc + storage/cache/pax_plasma_cache.cc + storage/columns/pax_column_cache.cc + storage/columns/pax_column_traits.cc + storage/columns/pax_column.cc + storage/columns/pax_compress.cc + storage/columns/pax_columns.cc + storage/columns/pax_encoding_utils.cc + storage/columns/pax_encoding_non_fixed_column.cc + storage/columns/pax_encoding_column.cc + storage/columns/pax_decoding.cc + storage/columns/pax_encoding.cc + storage/columns/pax_rlev2_decoding.cc + storage/columns/pax_rlev2_encoding.cc + storage/columns/pax_vec_column.cc + storage/columns/pax_vec_encoding_column.cc + storage/oper/pax_oper.cc + storage/oper/pax_stats.cc + storage/file_system.cc + storage/local_file_system.cc + storage/micro_partition.cc + storage/micro_partition_file_factory.cc + storage/micro_partition_metadata.cc + storage/micro_partition_row_filter_reader.cc + storage/micro_partition_stats.cc + storage/orc/orc_format_reader.cc + storage/orc/orc_group.cc + storage/orc/orc_vec_group.cc + storage/orc/orc_reader.cc + storage/orc/orc_writer.cc + storage/pax_buffer.cc + storage/pax_filter.cc + storage/proto/protobuf_stream.cc + ) + +add_library(paxformat SHARED ${PROTO_SRCS} 
${pax_storage_src} ${pax_exceptions_src} ${pax_comm_src} ) +target_compile_definitions(paxformat PRIVATE BUILD_PAX_FORMAT) +target_include_directories(paxformat PUBLIC ${ZTSD_HEADER} ${CMAKE_CURRENT_SOURCE_DIR} ${CBDB_INCLUDE_DIR}) +target_link_libraries(paxformat PUBLIC uuid protobuf zstd z) +set_target_properties(paxformat PROPERTIES + OUTPUT_NAME paxformat) +add_dependencies(paxformat generate_protobuf) + +# export headers +set(PAX_COMM_HEADERS + comm/bitmap.h + comm/cbdb_api.h + comm/log.h + comm/cbdb_wrappers.h + comm/pax_rel.h + comm/pax_memory.h + comm/guc.h +) + +set(PAX_EXCEPTION_HEADERS + exceptions/CException.h +) + +# TODO(gongxun): +# We should explicitly specify the headers +# that need to be exported, and use the syntax of +# install(FILES,...) to install the header files +install(DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/storage + DESTINATION ${CMAKE_INSTALL_PREFIX}/include/pax + FILES_MATCHING + PATTERN "*.h" +) + +install(FILES ${PAX_COMM_HEADERS} + DESTINATION ${CMAKE_INSTALL_PREFIX}/include/pax/comm +) + +install(FILES ${PAX_EXCEPTION_HEADERS} + DESTINATION ${CMAKE_INSTALL_PREFIX}/include/pax/exceptions +) + +## install dynamic libraray +install(TARGETS paxformat + LIBRARY DESTINATION ${CMAKE_INSTALL_PREFIX}/lib) + diff --git a/contrib/pax_storage/src/cpp/comm/bitmap.cc b/contrib/pax_storage/src/cpp/comm/bitmap.cc index 7009323445f..eeb2b404cfc 100644 --- a/contrib/pax_storage/src/cpp/comm/bitmap.cc +++ b/contrib/pax_storage/src/cpp/comm/bitmap.cc @@ -1,150 +1,23 @@ #include "comm/bitmap.h" -#include "exceptions/CException.h" - namespace pax { +const uint8 kNumBits[] = { + 0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4, + 1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5, + 1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, + 1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, + 3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7, + 1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, 
+ 3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7, + 2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6, + 3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7, + 3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7, + 4,5,5,6,5,6,6,7,5,6,6,7,6,7,7,8, +}; -DynamicBitmap::DynamicBitmap() { bitmap_.resize(1024); } -DynamicBitmap::DynamicBitmap(uint32 size) { bitmap_.resize(size); } - -DynamicBitmap::~DynamicBitmap() { bitmap_.clear(); } - -void DynamicBitmap::Set(uint32 index) { - CBDB_CHECK(index >= 0 && index < bitmap_.size(), - cbdb::CException::ExType::kExTypeOutOfRange); - bitmap_[index] = true; -} - -bool DynamicBitmap::Test(uint32 index) const { - CBDB_CHECK(index >= 0 && index < bitmap_.size(), - cbdb::CException::ExType::kExTypeOutOfRange); - return bitmap_[index]; -} - -void DynamicBitmap::Clear(uint32 index) { - CBDB_CHECK(index >= 0 && index < bitmap_.size(), - cbdb::CException::ExType::kExTypeOutOfRange); - bitmap_[index] = false; -} - -void DynamicBitmap::Reset() { bitmap_.clear(); } - -void DynamicBitmap::Resize(int size) { bitmap_.resize(size); } - -// TODO(gongxun): need to do optimization for this function -bool DynamicBitmap::BitmapFindFirst(uint32 offset, bool value, - uint32 *idx) const { - auto it = std::find(bitmap_.begin() + offset, bitmap_.end(), value); - if (it == bitmap_.end()) { - return false; - } - *idx = it - bitmap_.begin(); - return true; -} - -uint32 DynamicBitmap::NumBits() const { return bitmap_.size(); } - -FixedBitmap::FixedBitmap(uint32 size) { - byte_size_ = (size >> 3) + (size & 7 ? 
1 : 0); - bitmap_ = new uint8[byte_size_]; - - num_bits_ = size; - memset(bitmap_, 0, byte_size_); -} - -FixedBitmap::~FixedBitmap() { delete[] bitmap_; } - -void FixedBitmap::Set(uint32 index) { - CBDB_CHECK(index >= 0 && index < num_bits_, - cbdb::CException::ExType::kExTypeOutOfRange); - bitmap_[index >> 3] |= 1 << (index & 7); -} - -bool FixedBitmap::Test(uint32 index) const { - CBDB_CHECK(index >= 0 && index < num_bits_, - cbdb::CException::ExType::kExTypeOutOfRange); - return bitmap_[index >> 3] & (1 << (index & 7)); } - -void FixedBitmap::Reset() { std::memset(bitmap_, 0, byte_size_); } - -void FixedBitmap::Clear(uint32 index) { - CBDB_CHECK(index >= 0 && index < num_bits_, - cbdb::CException::ExType::kExTypeOutOfRange); - bitmap_[index >> 3] &= ~(1 << (index & 7)); -} - -uint32 FixedBitmap::Size() const { return byte_size_; } -uint32 FixedBitmap::NumBits() const { return num_bits_; } -bool FixedBitmap::BitmapFindFirst(uint32 offset, bool value, - uint32 *idx) const { - const uint64 pattern64[2] = {0xffffffffffffffff, 0x0000000000000000}; - const uint8 pattern8[2] = {0xff, 0x00}; - uint32 bit; - - if (offset >= num_bits_) { - return false; - } - - // Jump to the byte at specified offset - const uint8 *p = bitmap_ + (offset >> 3); - uint32 num_bits = num_bits_ - offset; - - // Find a 'value' bit at the end of the first byte - if ((bit = offset & 0x7)) { - for (; bit < 8 && num_bits > 0; ++bit) { - if (Test(((p - bitmap_) << 3) + bit) == value) { - *idx = ((p - bitmap_) << 3) + bit; - return true; - } - - num_bits--; - } - p++; - } - - // check 64bit at the time for a 'value' bit - const uint64 *u64 = (const uint64 *)p; - while (num_bits >= 64 && *u64 == pattern64[value]) { - num_bits -= 64; - u64++; - } - - // check 8bit at the time for a 'value' bit - p = (const uint8 *)u64; - while (num_bits >= 8 && *p == pattern8[value]) { - num_bits -= 8; - p++; - } - - // Find a 'value' bit at the beginning of the last byte - for (bit = 0; num_bits > 0; ++bit) { - if 
(Test(((p - bitmap_) << 3) + bit) == value) { - *idx = ((p - bitmap_) << 3) + bit; - return true; - } - num_bits--; - } - - return false; -} - -BitmapIterator::BitmapIterator(Bitmap *map) : offset_(0), bitmap_(map) {} - -void BitmapIterator::SeekTo(size_t bit) { - Assert(bit < bitmap_->NumBits()); - offset_ = bit; -} - -int32 BitmapIterator::Next(bool value) { - int32 len = bitmap_->NumBits() - offset_; - if (len <= 0) return -1; - uint32 index; - if (bitmap_->BitmapFindFirst(offset_, value, &index)) { - offset_ = index + 1; - return index; - } - return -1; -} - -} // namespace pax diff --git a/contrib/pax_storage/src/cpp/comm/bitmap.h b/contrib/pax_storage/src/cpp/comm/bitmap.h index daa5819a3a1..0d503be48f2 100644 --- a/contrib/pax_storage/src/cpp/comm/bitmap.h +++ b/contrib/pax_storage/src/cpp/comm/bitmap.h @@ -4,97 +4,261 @@ #include -#include #include -#include -#include -#include -#include -#include -namespace pax { +#include "comm/pax_memory.h" +#include "exceptions/CException.h" -class Bitmap { - public: - virtual ~Bitmap() {} - virtual void Set(uint32 index) = 0; - virtual bool Test(uint32 index) const = 0; - virtual void Clear(uint32 index) = 0; - virtual void Reset() = 0; - virtual bool BitmapFindFirst(uint32 offset, bool value, - uint32 *idx) const = 0; - virtual uint32 NumBits() const = 0; -}; - -class DynamicBitmap : public Bitmap { +namespace pax { +extern const uint8 kNumBits[]; +#define BM_WORD_BITS (sizeof(T) << 3) +// log2(BM_WORD_BITS) +#define BM_WORD_SHIFTS \ + (sizeof(T) == 1 ? 3 : (sizeof(T) == 2 ? 4 : (sizeof(T) == 4 ? 
5 : 6))) +#define BM_INDEX_WORD_OFF(index) ((index) >> BM_WORD_SHIFTS) +#define BM_INDEX_BIT_OFF(index) ((index) & (BM_WORD_BITS - 1)) +#define BM_INDEX_BIT(index) (1ULL << BM_INDEX_BIT_OFF(index)) +template +struct BitmapRaw final { public: - friend class BitmapIterator; - DynamicBitmap(); - explicit DynamicBitmap(uint32 size); + inline void Set(uint32 index) { + bitmap[BM_INDEX_WORD_OFF(index)] |= BM_INDEX_BIT(index); + } + // set first the bits [0, index] to 1 + inline void SetN(uint32 index) { + memset(&bitmap[0], -1, sizeof(T) * BM_INDEX_WORD_OFF(index)); + bitmap[BM_INDEX_WORD_OFF(index)] |= (BM_INDEX_BIT(index) << 1) - 1; + } + inline void Clear(uint32 index) { + bitmap[BM_INDEX_WORD_OFF(index)] &= ~BM_INDEX_BIT(index); + } + inline void ClearN(uint32 index) { + memset(&bitmap[0], 0, sizeof(T) * BM_INDEX_WORD_OFF(index)); + bitmap[BM_INDEX_WORD_OFF(index)] &= ~((BM_INDEX_BIT(index) << 1) - 1); + } + inline void ClearAll() { + AssertImply(size > 0, bitmap); + if (size > 0) memset(&bitmap[0], 0, sizeof(T) * size); + } + inline bool Test(uint32 index) const { + return (bitmap[BM_INDEX_WORD_OFF(index)] & BM_INDEX_BIT(index)) != 0; + } + // invert the bit and return the old value. 
+ inline bool Toggle(uint32 index) { + return !((bitmap[BM_INDEX_WORD_OFF(index)] ^= BM_INDEX_BIT(index)) & + BM_INDEX_BIT(index)); + } + inline size_t WordBits(T v) const { + if (sizeof(T) == 1) + return kNumBits[v]; + else if (sizeof(T) == 2) + return kNumBits[v & 0xff] + kNumBits[v >> 8]; + else if (sizeof(T) == 4) + return kNumBits[v & 0xff] + kNumBits[(v >> 8) & 0xff] + + kNumBits[(v >> 16) & 0xff] + kNumBits[(v >> 24) & 0xff]; + else if (sizeof(T) == 8) + return kNumBits[v & 0xff] + kNumBits[(v >> 8) & 0xff] + + kNumBits[(v >> 16) & 0xff] + kNumBits[(v >> 24) & 0xff] + + kNumBits[(v >> 32) & 0xff] + kNumBits[(v >> 40) & 0xff] + + kNumBits[(v >> 48) & 0xff] + kNumBits[(v >> 56) & 0xff]; + return 0; + } + // count bits in range [0, index] + inline size_t CountBits(uint32 index) const { + size_t nbits = 0; + for (uint32 i = 0; i < BM_INDEX_WORD_OFF(index); i++) + nbits += WordBits(bitmap[i]); + { + auto w = bitmap[BM_INDEX_WORD_OFF(index)]; + nbits += WordBits(w & ((BM_INDEX_BIT(index) << 1) - 1)); + } - virtual ~DynamicBitmap(); + return nbits; + } + // count bits in range [start, end] + inline size_t CountBits(uint32 start_index, uint32 end_index) const { + size_t nbits = 0; + uint32 word_off = BM_INDEX_WORD_OFF(start_index); - void Set(uint32 index) override; + Assert(start_index <= end_index); - bool Test(uint32 index) const override; + if (BM_INDEX_WORD_OFF(end_index) == word_off) { + uint32 w = bitmap[word_off] >> BM_INDEX_BIT_OFF(start_index); + return WordBits(w & ((1ULL << (end_index - start_index + 1)) - 1)); + } + { + uint32 w = bitmap[BM_INDEX_WORD_OFF(start_index)]; + nbits += WordBits(w >> BM_INDEX_BIT_OFF(start_index)); + } + for (uint32 i = BM_INDEX_WORD_OFF(start_index + BM_WORD_BITS), + n = BM_INDEX_WORD_OFF(end_index); + i < n; i++) + nbits += WordBits(bitmap[i]); + { + auto w = bitmap[BM_INDEX_WORD_OFF(end_index)]; + nbits += WordBits(w & ((BM_INDEX_BIT(end_index) << 1) - 1)); + } + return nbits; + } - void Clear(uint32 index) override; + 
inline bool HasEnoughSpace(uint32 index) const { + static_assert(sizeof(T) == 1 || sizeof(T) == 2 || sizeof(T) == 4 || + sizeof(T) == 8); + static_assert(BM_WORD_BITS == (1 << BM_WORD_SHIFTS)); + return (index >> BM_WORD_SHIFTS) < size; + } + inline bool Empty() const { + if (!bitmap) return true; + for (size_t i = 0; i < size; i++) + if (bitmap[i]) return false; + return true; + } + BitmapRaw() = default; + BitmapRaw(T *buffer, size_t size) : bitmap(buffer), size(size) {} + BitmapRaw(const BitmapRaw &) = delete; + BitmapRaw(BitmapRaw &&raw) : bitmap(raw.bitmap), size(raw.size) { + raw.bitmap = nullptr; + raw.size = 0; + } + BitmapRaw &operator=(BitmapRaw) = delete; + BitmapRaw &operator=(BitmapRaw &) = delete; + BitmapRaw &operator=(const BitmapRaw &) = delete; + BitmapRaw &operator=(BitmapRaw &&raw) { + if (this != &raw) { + PAX_DELETE_ARRAY(bitmap); + bitmap = raw.bitmap; + size = raw.size; + raw.bitmap = nullptr; + raw.size = 0; + } + return *this; + } - void Reset() override; + ~BitmapRaw() = default; - void Resize(int size); - - // TODO(gongxun): need to do optimization for this function - bool BitmapFindFirst(uint32 offset, bool value, uint32 *idx) const override; - - uint32 NumBits() const override; - - private: - std::vector bitmap_; + T *bitmap = nullptr; + size_t size = 0; }; -class FixedBitmap : public Bitmap { +template +class BitmapTpl final { public: - friend class BitmapIterator; - explicit FixedBitmap(uint32 size); + using BitmapMemoryPolicy = void (*)(BitmapRaw &, uint32); + explicit BitmapTpl(uint32 initial_size = 16, + BitmapMemoryPolicy policy = DefaultBitmapMemoryPolicy) { + static_assert(sizeof(T) == 1 || sizeof(T) == 2 || sizeof(T) == 4 || + sizeof(T) == 8); + static_assert(BM_WORD_BITS == (1 << BM_WORD_SHIFTS)); + policy_ = policy; + policy(raw_, Max(initial_size, 16)); + } + explicit BitmapTpl(const BitmapRaw &raw, BitmapMemoryPolicy policy) { + static_assert(sizeof(T) == 1 || sizeof(T) == 2 || sizeof(T) == 4 || + sizeof(T) == 8); + 
static_assert(BM_WORD_BITS == (1 << BM_WORD_SHIFTS)); + Assert(policy == ReadOnlyRefBitmap || policy == ReadOnlyOwnBitmap); + policy_ = policy; + raw_.bitmap = raw.bitmap; + raw_.size = raw.size; + } + BitmapTpl(const BitmapTpl &tpl) = delete; + BitmapTpl(BitmapTpl &&tpl) + : raw_(std::move(tpl.raw_)), policy_(tpl.policy_) {} + BitmapTpl &operator=(const BitmapTpl &tpl) = delete; + BitmapTpl &operator=(BitmapTpl &&tpl) = delete; + ~BitmapTpl() { + // Reference doesn't free the memory + if (policy_ == ReadOnlyRefBitmap) raw_.bitmap = nullptr; + } + inline size_t WordBits() const { return BM_WORD_BITS; } + inline void Set(uint32 index) { + if (unlikely(!raw_.HasEnoughSpace(index))) policy_(raw_, index); + raw_.Set(index); + } + inline void SetN(uint32 index) { + if (unlikely(!raw_.HasEnoughSpace(index))) policy_(raw_, index); + raw_.SetN(index); + } + inline void Clear(uint32 index) { + if (likely(raw_.HasEnoughSpace(index))) raw_.Clear(index); + } + inline void ClearN(uint32 index) { + if (raw_.HasEnoughSpace(index)) + raw_.ClearN(index); + else + raw_.ClearAll(); + } + inline void ClearAll() { raw_.ClearAll(); } + inline bool Test(uint32 index) const { + if (likely(raw_.HasEnoughSpace(index))) return raw_.Test(index); + return false; + } + // invert the bit and return the old value. 
+ inline bool Toggle(uint32 index) { + if (unlikely(!raw_.HasEnoughSpace(index))) policy_(raw_, index); + return raw_.Toggle(index); + } + // count bits in range [0, index] + inline size_t CountBits(uint32 index) const { + if (raw_.size == 0) return 0; + if ((raw_.size << BM_WORD_SHIFTS) <= index) + index = (raw_.size << BM_WORD_SHIFTS) - 1; + return raw_.CountBits(index); + } + inline size_t CountBits(uint32 start_index, uint32 end_index) const { + if ((raw_.size << BM_WORD_SHIFTS) <= start_index) return 0; + if ((raw_.size << BM_WORD_SHIFTS) <= end_index) + end_index = (raw_.size << BM_WORD_SHIFTS) - 1; + Assert(start_index <= end_index); + return raw_.CountBits(start_index, end_index); + } - virtual ~FixedBitmap(); + inline bool Empty() const { return raw_.Empty(); } - void Set(uint32 index) override; + BitmapMemoryPolicy Policy() const { return policy_; } - bool Test(uint32 index) const override; + const BitmapRaw &Raw() const { return raw_; } + BitmapRaw &Raw() { return raw_; } - void Reset() override; + static void DefaultBitmapMemoryPolicy(BitmapRaw &raw, uint32 index) { + auto old_bitmap = raw.bitmap; + auto old_size = raw.size; + auto size = Max(BM_INDEX_WORD_OFF(index) + 1, old_size * 2); + auto p = PAX_NEW_ARRAY(size); + if (old_size > 0) memcpy(p, old_bitmap, sizeof(T) * old_size); + memset(&p[old_size], 0, sizeof(T) * (size - old_size)); + raw.bitmap = p; + raw.size = size; + PAX_DELETE_ARRAY(old_bitmap); + } + static void ReadOnlyRefBitmap(BitmapRaw &/*raw*/, uint32 /*index*/) { + // raise + CBDB_RAISE(cbdb::CException::kExTypeInvalidMemoryOperation); + } + static void ReadOnlyOwnBitmap(BitmapRaw &/*raw*/, uint32 /*index*/) { + CBDB_RAISE(cbdb::CException::kExTypeInvalidMemoryOperation); + } - void Clear(uint32 index) override; - - uint32 Size() const; - - uint32 NumBits() const override; - - bool BitmapFindFirst(uint32 offset, bool value, uint32 *idx) const; + static inline size_t RequireWords(size_t nbits) { + return nbits ? 
((nbits - 1) >> BM_WORD_SHIFTS) + 1 : 0; + } + inline size_t CurrentBytes() const { return sizeof(T) * raw_.size; } + inline size_t MinimalStoredBytes(size_t nbits) { + auto nwords = RequireWords(nbits); + if (nwords > raw_.size) nwords = raw_.size; + while (nwords > 0 && raw_.bitmap[nwords - 1] == 0) nwords--; + return nwords * sizeof(T); + } private: - FixedBitmap(const FixedBitmap &other) = delete; - FixedBitmap(FixedBitmap &&other) = delete; - FixedBitmap &operator=(const FixedBitmap &other) = delete; - FixedBitmap &operator=(FixedBitmap &&other) = delete; - - uint32 byte_size_; - uint32 num_bits_; - uint8 *bitmap_; + inline bool HasEnoughSpace(uint32 index) const { + return raw_.HasEnoughSpace(index); + } + BitmapRaw raw_; + BitmapMemoryPolicy policy_; }; -class BitmapIterator { - public: - explicit BitmapIterator(Bitmap *map); - - void SeekTo(size_t bit); - - int32 Next(bool value); +using Bitmap8 = BitmapTpl; +using Bitmap64 = BitmapTpl; - private: - uint32 offset_; - Bitmap *bitmap_; -}; } // namespace pax diff --git a/contrib/pax_storage/src/cpp/comm/bitmap_test.cc b/contrib/pax_storage/src/cpp/comm/bitmap_test.cc index b92b18b63ca..f5f7f164725 100644 --- a/contrib/pax_storage/src/cpp/comm/bitmap_test.cc +++ b/contrib/pax_storage/src/cpp/comm/bitmap_test.cc @@ -5,68 +5,162 @@ namespace pax::tests { class BitMapTest : public ::testing::Test {}; -TEST_F(BitMapTest, test) { - FixedBitmap bit_map(100); - ASSERT_EQ(bit_map.Test(0), false); - ASSERT_EQ(bit_map.Test(99), false); - bit_map.Set(0); - ASSERT_EQ(bit_map.Test(0), true); - ASSERT_EQ(bit_map.Test(99), false); - bit_map.Set(99); - ASSERT_EQ(bit_map.Test(0), true); - ASSERT_EQ(bit_map.Test(99), true); - bit_map.Clear(0); - ASSERT_EQ(bit_map.Test(0), false); - ASSERT_EQ(bit_map.Test(99), true); - bit_map.Clear(99); - ASSERT_EQ(bit_map.Test(0), false); - ASSERT_EQ(bit_map.Test(99), false); - - ASSERT_EQ(bit_map.Size(), 13); +TEST_F(BitMapTest, Bitmap8) { + Bitmap8 bm(20); + + ASSERT_TRUE(bm.Empty()); + for 
(auto i = 0; i <= 128; i++) { + ASSERT_FALSE(bm.Test(i)); // zeros + ASSERT_FALSE(bm.Toggle(i)); + ASSERT_TRUE(bm.Test(i)); + ASSERT_TRUE(bm.Toggle(i)); + ASSERT_FALSE(bm.Test(i)); + + ASSERT_FALSE(bm.Test(i)); // zeros + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + + bm.Clear(i); + ASSERT_FALSE(bm.Test(i)); + bm.Clear(i); + ASSERT_FALSE(bm.Test(i)); + + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + } +} + +TEST_F(BitMapTest, Bitmap8SetN) { + Bitmap8 bm(10); + const auto nbits = 128; + + ASSERT_TRUE(bm.Empty()); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + + auto fn = [&bm, nbits](uint32 index) { + bm.ClearAll(); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + bm.SetN(index); + for (uint32 i = 0; i <= index; i++) ASSERT_TRUE(bm.Test(i)); + for (uint32 i = index + 1; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + }; + for (uint32 i = 0; i <= nbits; i++) fn(i); +} + +TEST_F(BitMapTest, Bitmap8ClearN) { + Bitmap8 bm(10); + const auto nbits = 128; + + ASSERT_TRUE(bm.Empty()); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + + auto fn = [&bm, nbits](uint32 index) { + for (auto i = 0; i <= nbits; i++) { + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + } + bm.ClearN(index); + for (uint32 i = 0; i <= index; i++) ASSERT_FALSE(bm.Test(i)); + for (uint32 i = index + 1; i <= nbits; i++) ASSERT_TRUE(bm.Test(i)); + }; + for (uint32 i = 0; i <= nbits; i++) fn(i); } -TEST_F(BitMapTest, FixedBitmap) { - FixedBitmap bit_map(100); - bit_map.Set(0); - bit_map.Set(50); - bit_map.Set(99); +TEST_F(BitMapTest, Bitmap64) { + Bitmap64 bm(100); - BitmapIterator it(&bit_map); + ASSERT_TRUE(bm.Empty()); + for (auto i = 0; i <= 128; i++) { + ASSERT_FALSE(bm.Test(i)); // zeros + ASSERT_FALSE(bm.Toggle(i)); + ASSERT_TRUE(bm.Test(i)); + ASSERT_TRUE(bm.Toggle(i)); + ASSERT_FALSE(bm.Test(i)); - ASSERT_EQ(it.Next(true), 0); - ASSERT_EQ(it.Next(true), 50); - ASSERT_EQ(it.Next(true), 99); + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + 
bm.Set(i); + ASSERT_TRUE(bm.Test(i)); - it.SeekTo(0); - ASSERT_EQ(it.Next(false), 1); - ASSERT_EQ(it.Next(false), 2); - ASSERT_EQ(it.Next(false), 3); + bm.Clear(i); + ASSERT_FALSE(bm.Test(i)); + bm.Clear(i); + ASSERT_FALSE(bm.Test(i)); + + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + } } +TEST_F(BitMapTest, Bitmap64SetN) { + Bitmap64 bm(1); + const auto nbits = 512; -TEST_F(BitMapTest, DynamicBitmap) { - DynamicBitmap bit_map(100); - bit_map.Set(0); - bit_map.Set(50); - bit_map.Set(99); + ASSERT_TRUE(bm.Empty()); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); - BitmapIterator it(&bit_map); + auto fn = [&bm, nbits](uint32 index) { + bm.ClearAll(); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + bm.SetN(index); + for (uint32 i = 0; i <= index; i++) ASSERT_TRUE(bm.Test(i)); + for (uint32 i = index + 1; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); + }; + for (uint32 i = 0; i <= nbits; i++) fn(i); +} - ASSERT_EQ(it.Next(true), 0); - ASSERT_EQ(it.Next(true), 50); - ASSERT_EQ(it.Next(true), 99); +TEST_F(BitMapTest, Bitmap64ClearN) { + Bitmap64 bm(1); + const auto nbits = 512; - bit_map.Resize(200); - bit_map.Set(100); - bit_map.Set(150); - bit_map.Set(199); + ASSERT_TRUE(bm.Empty()); + for (auto i = 0; i <= nbits; i++) ASSERT_FALSE(bm.Test(i)); - ASSERT_EQ(it.Next(true), 100); - ASSERT_EQ(it.Next(true), 150); - ASSERT_EQ(it.Next(true), 199); + auto fn = [&bm, &nbits](uint32 index) { + for (auto i = 0; i <= nbits; i++) { + bm.Set(i); + ASSERT_TRUE(bm.Test(i)); + } + bm.ClearN(index); + for (uint32 i = 0; i <= index; i++) ASSERT_FALSE(bm.Test(i)); + for (uint32 i = index + 1; i <= nbits; i++) ASSERT_TRUE(bm.Test(i)); + }; + for (uint32 i = 0; i <= nbits; i++) fn(i); +} + +TEST_F(BitMapTest, CountBits) { + const uint32 starts[] = {0, 1, 3, 7}; + const uint32 ends[] = {0, 1, 7, 8, 9, 15, 16, 17}; + Bitmap8 bm(11); - it.SeekTo(0); - ASSERT_EQ(it.Next(false), 1); - ASSERT_EQ(it.Next(false), 2); - ASSERT_EQ(it.Next(false), 3); + auto fill_bits = 
[&bm](uint32 bits) { + uint32 k = 0; + bm.ClearAll(); + while (bits) { + if (bits & 1) bm.Set(k); + bits = bits >> 1; + k++; + } + }; + auto plain_count = [](uint32 bits, uint32 start, uint32 end) { + size_t nbits = 0; + for (auto i = start; i <= end; i++) { + if (bits & (1ULL << i)) nbits++; + } + return nbits; + }; + + for (uint32 i = 0; i < 0x3ffff; i++) { + fill_bits(i); + for (auto start : starts) { + for (auto end : ends) { + if (end < start) continue; + ASSERT_EQ(bm.CountBits(start, end), plain_count(i, start, end)); + ASSERT_EQ(bm.CountBits(end), plain_count(i, 0, end)); + } + } + } } + } // namespace pax::tests diff --git a/contrib/pax_storage/src/cpp/comm/cbdb_api.h b/contrib/pax_storage/src/cpp/comm/cbdb_api.h index b97800252ee..dcf074ed37b 100644 --- a/contrib/pax_storage/src/cpp/comm/cbdb_api.h +++ b/contrib/pax_storage/src/cpp/comm/cbdb_api.h @@ -1,11 +1,19 @@ #ifndef SRC_CPP_COMM_CBDB_API_H_ #define SRC_CPP_COMM_CBDB_API_H_ +#include "comm/pax_rel.h" + #ifdef __cplusplus extern "C" { #endif + +#pragma GCC diagnostic push +#pragma GCC diagnostic ignored "-Wregister" + #include "postgres.h" // NOLINT +#include "postmaster/postmaster.h" +#include "access/detoast.h" #include "access/genam.h" #include "access/heapam.h" #include "access/relscan.h" @@ -14,17 +22,39 @@ extern "C" { #include "access/tsmapi.h" #include "access/tupdesc.h" #include "access/tupdesc_details.h" +#include "catalog/catalog.h" #include "catalog/dependency.h" #include "catalog/heap.h" +#include "catalog/gp_indexing.h" +#include "catalog/index.h" #include "catalog/indexing.h" +#include "catalog/objectaccess.h" #include "catalog/oid_dispatch.h" #include "catalog/pg_am.h" #include "catalog/pg_amop.h" #include "catalog/pg_amproc.h" +#include "catalog/pg_attribute_encoding.h" +#include "catalog/pg_collation.h" #include "catalog/pg_namespace.h" +#include "catalog/pg_opclass.h" +#include "catalog/toasting.h" +#include "commands/progress.h" +#include "commands/tablecmds.h" +#include 
"nodes/execnodes.h" +#include "funcapi.h" +#include "partitioning/partdesc.h" +#include "partitioning/partbounds.h" +#include "pgstat.h" +#include "utils/partcache.h" +#include "utils/ruleutils.h" +#include "access/nbtree.h" +#include "access/hash.h" +#include "parser/parse_utilcmd.h" +#include "nodes/makefuncs.h" +#include "parser/parse_oper.h" +#include "parser/parse_expr.h" #ifndef BUILD_PAX_FORMAT #include "access/reloptions.h" -#include "catalog/pg_pax_tables.h" #endif #include "catalog/storage.h" #include "cdb/cdbvars.h" @@ -41,33 +71,32 @@ extern "C" { #include "storage/lwlock.h" #include "storage/relfilenode.h" #include "storage/smgr.h" +#include "utils/backend_progress.h" #include "utils/builtins.h" +#include "utils/date.h" #include "utils/datum.h" #include "utils/elog.h" #include "utils/hsearch.h" #include "utils/lsyscache.h" #include "utils/memutils.h" +#include "utils/numeric.h" #include "utils/relcache.h" #include "utils/snapshot.h" #include "utils/syscache.h" #include "utils/wait_event.h" // no header file in cbdb -extern BlockNumber system_nextsampleblock(SampleScanState *node, BlockNumber nblocks); // NOLINT -extern bool extractcolumns_from_node(Node *expr, bool *cols, AttrNumber natts); // NOLINT +extern BlockNumber system_nextsampleblock(SampleScanState *node, // NOLINT + BlockNumber nblocks); +extern bool extractcolumns_from_node(Node *expr, bool *cols, // NOLINT + AttrNumber natts); +extern int get_partition_for_tuple(PartitionKey key, PartitionDesc partdesc, // NOLINT + Datum *values, bool *isnull); extern Oid GetDefaultOpClass(Oid type_id, Oid am_id); + +#pragma GCC diagnostic pop #ifdef __cplusplus } #endif -#define PAX_TABLE_AM_OID 7014 -#define PAX_AMNAME "pax" -#define PAX_AM_HANDLER_OID 7600 -#define PAX_AM_HANDLER_NAME "pax_tableam_handler" - -#define PAX_AUX_STATS_IN_OID 7601 -#define PAX_AUX_STATS_OUT_OID 7602 -#define PAX_AUX_STATS_TYPE_OID 7603 -#define PAX_AUX_STATS_TYPE_NAME "paxauxstats" - #endif // SRC_CPP_COMM_CBDB_API_H_ diff 
--git a/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.cc b/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.cc index fb7c4beced4..cb683fdfea6 100644 --- a/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.cc +++ b/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.cc @@ -1,6 +1,6 @@ #include "comm/cbdb_wrappers.h" + #include "comm/paxc_wrappers.h" -#include "storage/paxc_block_map_manager.h" extern "C" { const char *progname; } @@ -83,22 +83,6 @@ void Pfree(void *ptr) { } // namespace cbdb -void *operator new(std::size_t size) { return cbdb::Palloc(size); } - -void *operator new[](std::size_t size) { return cbdb::Palloc(size); } - -void *operator new(std::size_t size, MemoryContext ctx) { - return cbdb::MemCtxAlloc(ctx, size); -} - -void *operator new[](std::size_t size, MemoryContext ctx) { - return cbdb::MemCtxAlloc(ctx, size); -} - -void operator delete(void *ptr) { if (ptr) cbdb::Pfree(ptr); } - -void operator delete[](void *ptr) { if (ptr) cbdb::Pfree(ptr); } - HTAB *cbdb::HashCreate(const char *tabname, int64 nelem, const HASHCTL *info, int flags) { CBDB_WRAP_START; @@ -173,6 +157,14 @@ Datum cbdb::DatumFromPointer(const void *p, int16 typlen) { } #endif + +struct varlena *cbdb::PgDeToastDatum(struct varlena *datum) { + CBDB_WRAP_START; + { return detoast_attr(datum); } + CBDB_WRAP_END; + return nullptr; +} + struct varlena *cbdb::PgDeToastDatumPacked(struct varlena *datum) { CBDB_WRAP_START; { return pg_detoast_datum_packed(datum); } @@ -191,39 +183,10 @@ void *cbdb::PointerAndLenFromDatum(Datum d, int *len) { CBDB_WRAP_END; } -// pax ctid mapping functions - -void cbdb::InitCommandResource() { +void cbdb::SlotGetMissingAttrs(TupleTableSlot *slot, int start_attno, + int last_attno) { CBDB_WRAP_START; - { paxc::init_command_resource(); } - CBDB_WRAP_END; -} -void cbdb::ReleaseCommandResource() { - CBDB_WRAP_START; - { paxc::release_command_resource(); } - CBDB_WRAP_END; -} - -void cbdb::GetTableIndexAndTableNumber(Oid table_rel_oid, uint8 *table_no, - uint32 
*table_index) { - CBDB_WRAP_START; - { - paxc::get_table_index_and_table_number(table_rel_oid, table_no, - table_index); - } - CBDB_WRAP_END; -} - -uint32 cbdb::GetBlockNumber(Oid table_rel_oid, uint32 table_index, - paxc::PaxBlockId block_id) { - CBDB_WRAP_START; - { return paxc::get_block_number(table_rel_oid, table_index, block_id); } - CBDB_WRAP_END; -} -paxc::PaxBlockId cbdb::GetBlockId(Oid table_rel_oid, uint8 table_no, - uint32 block_number) { - CBDB_WRAP_START; - { return paxc::get_block_id(table_rel_oid, table_no, block_number); } + { slot_getmissingattrs(slot, start_attno, last_attno); } CBDB_WRAP_END; } @@ -299,16 +262,10 @@ std::string cbdb::BuildPaxDirectoryPath(RelFileNode rd_node, CBDB_WRAP_END; } -std::string cbdb::BuildPaxFilePath(const Relation rel, +std::string cbdb::BuildPaxFilePath(const std::string &rel_path, const std::string &block_id) { - CBDB_WRAP_START; - { - char *tmp_str = paxc::BuildPaxFilePath(rel, block_id.c_str()); - std::string ret_str(tmp_str); - pfree(tmp_str); - return ret_str; - } - CBDB_WRAP_END; + Assert(!rel_path.empty()); + return rel_path + "/" + block_id; } int cbdb::RelationGetAttributesNumber(Relation rel) { @@ -317,56 +274,124 @@ int cbdb::RelationGetAttributesNumber(Relation rel) { CBDB_WRAP_END; } +StdRdOptions **cbdb::RelGetAttributeOptions(Relation rel) { + CBDB_WRAP_START; + { return RelationGetAttributeOptions(rel); } + CBDB_WRAP_END; +} + TupleDesc cbdb::RelationGetTupleDesc(Relation rel) { CBDB_WRAP_START; { return RelationGetDescr(rel); } CBDB_WRAP_END; } -bool cbdb::ExtractcolumnsFromNode(Node *expr, bool *cols, AttrNumber natts) { +bool cbdb::IsSystemAttrNumExist(struct PaxcExtractcolumnContext *context, + AttrNumber number) { + Assert(number < 0 && number > FirstLowInvalidHeapAttributeNumber && context); + return context->system_attr_number_mask[~number]; +} + +extern "C" { + +static bool paxc_extractcolumns_walker( // NOLINT + Node *node, struct PaxcExtractcolumnContext *ec_ctx) { + if (node == NULL) { + 
return false; + } + + if (IsA(node, Var)) { + Var *var = (Var *)node; + + if (IS_SPECIAL_VARNO(var->varno)) return false; + + if (var->varattno < 0) { + Assert(var->varattno > FirstLowInvalidHeapAttributeNumber); + ec_ctx->system_attr_number_mask[~var->varattno] = true; + } else if (ec_ctx->cols) { + if (var->varattno == 0) { + // If all attributes are included, + // set all entries in mask to true. + for (int attno = 0; attno < ec_ctx->natts; attno++) + ec_ctx->cols[attno] = true; + ec_ctx->found = true; + } else if (var->varattno <= ec_ctx->natts) { + ec_ctx->cols[var->varattno - 1] = true; + ec_ctx->found = true; + } + // Still need fill `system_attr_number_mask` + // Let this case return false + } + + return false; + } + + return expression_tree_walker(node, (bool (*)())paxc_extractcolumns_walker, + (void *)ec_ctx); +} + +}; // extern "C" + +bool cbdb::ExtractcolumnsFromNode(Node *expr, + struct PaxcExtractcolumnContext *ec_ctx) { + CBDB_WRAP_START; + { + paxc_extractcolumns_walker(expr, ec_ctx); + return ec_ctx->found; + } + CBDB_WRAP_END; +} + +bool cbdb::ExtractcolumnsFromNode(Node *expr, bool *cols, int natts) { CBDB_WRAP_START; { return extractcolumns_from_node(expr, cols, natts); } CBDB_WRAP_END; } -bool cbdb::MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, StrategyNumber strategynum) -{ +bool cbdb::MinMaxGetStrategyProcinfo(Oid atttypid, Oid subtype, Oid *opfamily, FmgrInfo *finfo, + StrategyNumber strategynum) { CBDB_WRAP_START; - { return paxc::MinMaxGetStrategyProcinfo(atttypid, procid, finfo, strategynum); } + { + return paxc::MinMaxGetStrategyProcinfo(atttypid, subtype, opfamily, finfo, + strategynum); + } CBDB_WRAP_END; } -Datum cbdb::FunctionCall1Coll(FmgrInfo *flinfo, Oid collation, Datum arg1) -{ +Datum cbdb::FunctionCall1Coll(FmgrInfo *flinfo, Oid collation, Datum arg1) { CBDB_WRAP_START; - { return ::FunctionCall1Coll(flinfo, collation, arg1); } + { return ::FunctionCall1Coll(flinfo, collation, arg1); } CBDB_WRAP_END; } 
-Datum cbdb::FunctionCall2Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2) -{ +Datum cbdb::FunctionCall2Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, + Datum arg2) { CBDB_WRAP_START; - { return ::FunctionCall2Coll(flinfo, collation, arg1, arg2); } + { return ::FunctionCall2Coll(flinfo, collation, arg1, arg2); } CBDB_WRAP_END; } -Datum cbdb::FunctionCall3Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3) -{ +Datum cbdb::FunctionCall3Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, + Datum arg2, Datum arg3) { CBDB_WRAP_START; - { return ::FunctionCall3Coll(flinfo, collation, arg1, arg2, arg3); } + { return ::FunctionCall3Coll(flinfo, collation, arg1, arg2, arg3); } CBDB_WRAP_END; } -Datum cbdb::FunctionCall4Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3, Datum arg4) -{ +Datum cbdb::FunctionCall4Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, + Datum arg2, Datum arg3, Datum arg4) { CBDB_WRAP_START; - { return ::FunctionCall4Coll(flinfo, collation, arg1, arg2, arg3, arg4); } + { return ::FunctionCall4Coll(flinfo, collation, arg1, arg2, arg3, arg4); } CBDB_WRAP_END; } -SysScanDesc cbdb::SystableBeginScan(Relation rel, Oid index_id, bool index_ok, Snapshot snapshot, int n_keys, ScanKey keys) { +SysScanDesc cbdb::SystableBeginScan(Relation rel, Oid index_id, bool index_ok, + Snapshot snapshot, int n_keys, + ScanKey keys) { CBDB_WRAP_START; - { return systable_beginscan(rel, index_id, index_ok, snapshot, n_keys, keys); } + { + return systable_beginscan(rel, index_id, index_ok, snapshot, n_keys, keys); + } CBDB_WRAP_END; } @@ -382,7 +407,8 @@ void cbdb::SystableEndScan(SysScanDesc desc) { CBDB_WRAP_END; } -Datum cbdb::HeapGetAttr(HeapTuple tup, int attnum, TupleDesc tuple_desc, bool *isnull) { +Datum cbdb::HeapGetAttr(HeapTuple tup, int attnum, TupleDesc tuple_desc, + bool *isnull) { CBDB_WRAP_START; { return heap_getattr(tup, attnum, tuple_desc, isnull); } CBDB_WRAP_END; diff --git 
a/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.h b/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.h index 9f80b5e614c..02b10f2d007 100644 --- a/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.h +++ b/contrib/pax_storage/src/cpp/comm/cbdb_wrappers.h @@ -6,13 +6,28 @@ #include #include "exceptions/CException.h" -#include "storage/pax_block_id.h" + +struct PaxcExtractcolumnContext { + // If cols set and call ExtractcolumnsFromNode with + // `target list`. Then the cols will fill with projection mask. + bool *cols = nullptr; + int natts = 0; + bool found = false; + + // This mask use to filter system attribute number. + // (~AttrNumber) will be index, mapping the [0, + // FirstLowInvalidHeapAttributeNumber) call `IsSystemAttrNumExist` to check + // system-defined attributes set + bool system_attr_number_mask[~FirstLowInvalidHeapAttributeNumber] = { + 0}; // NOLINT +}; namespace cbdb { #define PAX_ALLOCSET_DEFAULT_MINSIZE ALLOCSET_DEFAULT_MINSIZE #define PAX_ALLOCSET_DEFAULT_INITSIZE (8 * 1024) #define PAX_ALLOCSET_DEFAULT_MAXSIZE (3 * 64 * 1024 * 1024) + #define PAX_ALLOCSET_DEFAULT_SIZES \ PAX_ALLOCSET_DEFAULT_MINSIZE, PAX_ALLOCSET_DEFAULT_INITSIZE, \ PAX_ALLOCSET_DEFAULT_MAXSIZE @@ -98,23 +113,17 @@ static inline Datum Int64ToDatum(int64 d) noexcept { return Int64GetDatum(d); } void *PointerAndLenFromDatum(Datum d, int *len); +void SlotGetMissingAttrs(TupleTableSlot *slot, int start_attno, int last_attno); + #ifdef RUN_GTEST Datum DatumFromCString(const char *src, size_t length); Datum DatumFromPointer(const void *p, int16 typlen); #endif -struct varlena *PgDeToastDatumPacked(struct varlena *datum); +struct varlena *PgDeToastDatum(struct varlena *datum); -// pax ctid mapping functions -void InitCommandResource(); -void ReleaseCommandResource(); -void GetTableIndexAndTableNumber(Oid table_rel_oid, uint8 *table_no, - uint32 *table_index); -uint32 GetBlockNumber(Oid table_rel_oid, uint32 table_index, - paxc::PaxBlockId block_id); -paxc::PaxBlockId GetBlockId(Oid 
table_rel_oid, uint8 table_no, - uint32 block_number); +struct varlena *PgDeToastDatumPacked(struct varlena *datum); void RelationCreateStorageDirectory(RelFileNode rnode, char relpersistence, SMgrImpl smgr_which, Relation rel); @@ -137,31 +146,44 @@ void MakedirRecursive(const char *path); std::string BuildPaxDirectoryPath(RelFileNode rd_node, BackendId rd_backend); +std::string BuildPaxFilePath(const std::string &rel_path, const std::string &block_id); + int RelationGetAttributesNumber(Relation rel); +StdRdOptions **RelGetAttributeOptions(Relation rel); TupleDesc RelationGetTupleDesc(Relation rel); -bool ExtractcolumnsFromNode(Node *expr, bool *cols, AttrNumber natts); +bool ExtractcolumnsFromNode(Node *expr, + struct PaxcExtractcolumnContext *ec_ctx); + +bool IsSystemAttrNumExist(struct PaxcExtractcolumnContext *context, + AttrNumber number); -std::string BuildPaxFilePath(Relation rel, const std::string &block_id); +bool ExtractcolumnsFromNode(Node *expr, bool *cols, int natts); -bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, StrategyNumber strategynum); +bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid subtype, Oid *opfamily, FmgrInfo *finfo, + StrategyNumber strategynum); Datum FunctionCall1Coll(FmgrInfo *flinfo, Oid collation, Datum arg1); -Datum FunctionCall2Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2); +Datum FunctionCall2Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, + Datum arg2); -Datum FunctionCall3Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3); +Datum FunctionCall3Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, + Datum arg3); -Datum FunctionCall4Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3, Datum arg4); +Datum FunctionCall4Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, + Datum arg3, Datum arg4); -SysScanDesc SystableBeginScan(Relation rel, Oid index_id, bool index_ok, Snapshot snapshot, int n_keys, ScanKey keys); 
+SysScanDesc SystableBeginScan(Relation rel, Oid index_id, bool index_ok, + Snapshot snapshot, int n_keys, ScanKey keys); HeapTuple SystableGetNext(SysScanDesc desc); void SystableEndScan(SysScanDesc desc); -Datum HeapGetAttr(HeapTuple tup, int attnum, TupleDesc tuple_desc, bool *isnull); +Datum HeapGetAttr(HeapTuple tup, int attnum, TupleDesc tuple_desc, + bool *isnull); Relation TableOpen(Oid relid, LOCKMODE lockmode); @@ -188,13 +210,3 @@ void TableClose(Relation rel, LOCKMODE lockmode); } \ } // clang-format on - -// override the default new/delete to use current memory context -extern void *operator new(std::size_t size); -extern void *operator new[](std::size_t size); -extern void operator delete(void *ptr); -extern void operator delete[](void *ptr); - -// specify memory context for this allocation without switching memory context -extern void *operator new(std::size_t size, MemoryContext ctx); -extern void *operator new[](std::size_t size, MemoryContext ctx); diff --git a/contrib/pax_storage/src/cpp/comm/comm_test.cc b/contrib/pax_storage/src/cpp/comm/comm_test.cc index da867ecae32..3ff39adab1a 100644 --- a/contrib/pax_storage/src/cpp/comm/comm_test.cc +++ b/contrib/pax_storage/src/cpp/comm/comm_test.cc @@ -11,8 +11,6 @@ class CommTest : public ::testing::Test { 1 * 1024 * 1024, 1 * 1024 * 1024); MemoryContextSwitchTo(comm_test_memory_context); } - - void TearDown() override {} }; TEST_F(CommTest, TestDeleteOperator) { @@ -32,4 +30,19 @@ TEST_F(CommTest, TestDeleteOperator) { delete[] array_obj; } + +TEST_F(CommTest, TestNewOperator) { + auto obj = new bool[0]; + ASSERT_NE(obj, nullptr); + delete[] obj; + + auto obj2 = cbdb::Palloc(0); + ASSERT_NE(obj2, nullptr); + cbdb::Pfree(obj2); + + auto obj3 = cbdb::Palloc0(0); + ASSERT_NE(obj3, nullptr); + cbdb::Pfree(obj3); +} + } // namespace pax::tests \ No newline at end of file diff --git a/contrib/pax_storage/src/cpp/comm/guc.cc b/contrib/pax_storage/src/cpp/comm/guc.cc new file mode 100644 index 
00000000000..7ae3334ac50 --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/guc.cc @@ -0,0 +1,15 @@ +#include "comm/guc.h" + +#include "storage/pax_defined.h" + +namespace pax { +bool pax_enable_debug = true; +bool pax_enable_filter = true; +int pax_scan_reuse_buffer_size = 0; +int pax_max_tuples_per_group = VEC_BATCH_LENGTH; + +#ifdef ENABLE_PLASMA +bool pax_enable_plasma_in_mem = true; +#endif + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/comm/guc.h b/contrib/pax_storage/src/cpp/comm/guc.h new file mode 100644 index 00000000000..c53678dc0dc --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/guc.h @@ -0,0 +1,13 @@ +#pragma once + +namespace pax { +extern bool pax_enable_debug; +extern bool pax_enable_filter; +extern int pax_scan_reuse_buffer_size; +extern int pax_max_tuples_per_group; + +#ifdef ENABLE_PLASMA +extern bool pax_enable_plasma_in_mem; +#endif + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/comm/log.h b/contrib/pax_storage/src/cpp/comm/log.h new file mode 100644 index 00000000000..21f2853b98e --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/log.h @@ -0,0 +1,12 @@ +#pragma once + +// Should never call PAX_LOG* without PAX_ENABLE_DEBUG +#define PAX_LOG_IF(ok, ...) \ + do { \ + if (ok) elog(LOG, __VA_ARGS__); \ + } while (0) + +#define PAX_LOG(...) 
\ + do { \ + elog(LOG, __VA_ARGS__); \ + } while (0) diff --git a/contrib/pax_storage/src/cpp/comm/pax_defer.h b/contrib/pax_storage/src/cpp/comm/pax_defer.h deleted file mode 100644 index ad39ba76bbd..00000000000 --- a/contrib/pax_storage/src/cpp/comm/pax_defer.h +++ /dev/null @@ -1,28 +0,0 @@ -#pragma once - -#include - -namespace pax { - -template -class Defer { - public: - const F function; - - public: - constexpr explicit Defer(const F &function) : function{function} {} - constexpr explicit Defer(F &&function) : function{std::move(function)} {} - ~Defer() { function(); } -}; - -template -inline Defer make_defer(F &&function) { - return Defer(std::forward(function)); -} - -} // namespace pax - -#define DEFER_CONCAT(n, ...) \ - const auto defer##n = pax::make_defer([&] { __VA_ARGS__; }) -#define DEFER_FORWARD(n, ...) DEFER_CONCAT(n, __VA_ARGS__) -#define DEFER(...) DEFER_FORWARD(__LINE__, __VA_ARGS__) diff --git a/contrib/pax_storage/src/cpp/comm/pax_memory.cc b/contrib/pax_storage/src/cpp/comm/pax_memory.cc new file mode 100644 index 00000000000..b9c05660709 --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/pax_memory.cc @@ -0,0 +1,25 @@ +#include "comm/pax_memory.h" + +#include "comm/cbdb_wrappers.h" + +void *operator new(std::size_t size) { return cbdb::Palloc(size); } + +void *operator new[](std::size_t size) { return cbdb::Palloc(size); } + +void *operator new(std::size_t size, MemoryContext ctx) { + return cbdb::MemCtxAlloc(ctx, size); +} + +void *operator new[](std::size_t size, MemoryContext ctx) { + return cbdb::MemCtxAlloc(ctx, size); +} + +void operator delete(void *ptr) { + if (ptr) cbdb::Pfree(ptr); +} + +void operator delete[](void *ptr) { + if (ptr) cbdb::Pfree(ptr); +} + + diff --git a/contrib/pax_storage/src/cpp/comm/pax_memory.h b/contrib/pax_storage/src/cpp/comm/pax_memory.h new file mode 100644 index 00000000000..03a81c036b1 --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/pax_memory.h @@ -0,0 +1,60 @@ +#pragma once +#include 
"comm/cbdb_api.h" +#include + +//#include "memory_allocator.h" + +namespace pax { + +template +static inline T* PAX_NEW(Args&&... args) { + return new T(std::forward(args)...); +} + +template +static inline T* PAX_NEW_ARRAY(size_t N) { + return new T[N]; +} + +template +static inline void PAX_DELETE(T *&obj) { + delete obj; + obj = nullptr; +} + +template +static inline void PAX_DELETE_ARRAY(T *&obj) { + delete []obj; + obj = nullptr; +} + +struct PaxMemoryDeleter { + template + inline void operator()(T* p) const { + delete p; + } +}; + +template +using pax_unique_ptr = std::unique_ptr; + +template +using pax_shared_ptr = std::shared_ptr; + +//template +//using pax_unique_ptr = std::unique_ptr; + +//template +//using pax_shared_ptr = std::shared_ptr; + +} + +// override the default new/delete to use current memory context +extern void *operator new(std::size_t size); +extern void *operator new[](std::size_t size); +extern void operator delete(void *ptr); +extern void operator delete[](void *ptr); + +// specify memory context for this allocation without switching memory context +extern void *operator new(std::size_t size, MemoryContext ctx); +extern void *operator new[](std::size_t size, MemoryContext ctx); diff --git a/contrib/pax_storage/src/cpp/comm/pax_rel.h b/contrib/pax_storage/src/cpp/comm/pax_rel.h new file mode 100644 index 00000000000..43934b475ff --- /dev/null +++ b/contrib/pax_storage/src/cpp/comm/pax_rel.h @@ -0,0 +1,29 @@ + +#ifndef SRC_CPP_COMM_PAX_REL_H_ +#define SRC_CPP_COMM_PAX_REL_H_ + +// Oid of pg_ext_aux.pg_pax_tables +#define PAX_TABLES_RELATION_ID 7061 +#define PAX_TABLES_RELID_INDEX_ID 7047 + +#define PAX_TABLE_AM_OID 7047 +#define PAX_AMNAME "pax" +#define PAX_AM_HANDLER_OID 7600 +#define PAX_AM_HANDLER_NAME "pax_tableam_handler" + +#define PAX_AUX_STATS_IN_OID 7601 +#define PAX_AUX_STATS_OUT_OID 7602 +#define PAX_AUX_STATS_TYPE_OID 7603 +#define PAX_AUX_STATS_TYPE_NAME "paxauxstats" + +#define PAX_FASTSEQUENCE_OID 7604 +#define 
PAX_FASTSEQUENCE_INDEX_OID 7605 + +#define PG_PAX_FASTSEQUENCE_NAMESPACE "pg_ext_aux" +#define PG_PAX_FASTSEQUENCE_TABLE "pg_pax_fastsequence" +#define PG_PAX_FASTSEQUENCE_INDEX_NAME "pg_pax_fastsequence_objid_idx" + +#define AMHandlerIsPAX(amhandler) ((amhandler) == PAX_AM_HANDLER_OID) +#define RelationIsPAX(relation) AMHandlerIsPAX((relation)->rd_amhandler) + +#endif // SRC_CPP_COMM_PAX_REL_H_ \ No newline at end of file diff --git a/contrib/pax_storage/src/cpp/comm/paxc_wrappers.cc b/contrib/pax_storage/src/cpp/comm/paxc_wrappers.cc index c968ae70940..219b7897259 100644 --- a/contrib/pax_storage/src/cpp/comm/paxc_wrappers.cc +++ b/contrib/pax_storage/src/cpp/comm/paxc_wrappers.cc @@ -155,21 +155,6 @@ char *BuildPaxDirectoryPath(RelFileNode rd_node, BackendId rd_backend) { return paxrelpath; } -// BuildPaxFilePath: function used to build pax storage directory path following -// pg convension, for example base/{database_oid}/{blocks_relid}_pax. parameter -// rel IN Relation information. parameter block_id IN micro-partition block id. -// return palloc'd pax storage directory path. 
-char *BuildPaxFilePath(Relation rel, const char *block_id) { - char *relpath = NULL; - char *filepath = NULL; - - relpath = BuildPaxDirectoryPath(rel->rd_node, rel->rd_backend); - Assert(relpath[0] != '\0'); - filepath = psprintf("%s/%s", relpath, block_id); - pfree(relpath); - return filepath; -} - static void UnlinkIfExistsFname(const char *fname, bool isdir, int elevel) { if (isdir) { if (rmdir(fname) != 0 && errno != ENOENT) @@ -224,12 +209,11 @@ static void DeletePaxDirectoryPathRecursive( } } -bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, StrategyNumber strategynum) +bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid subtype, Oid *opfamily, FmgrInfo *finfo, StrategyNumber strategynum) { FmgrInfo dummy; HeapTuple tuple; Oid opclass; - Oid opfamily; Oid oprid; RegProcedure opcode; bool isNull; @@ -238,10 +222,10 @@ bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, Strat if (!OidIsValid(opclass)) return false; - opfamily = get_opclass_family(opclass); - tuple = SearchSysCache4(AMOPSTRATEGY, ObjectIdGetDatum(opfamily), - ObjectIdGetDatum(atttypid), + *opfamily = get_opclass_family(opclass); + tuple = SearchSysCache4(AMOPSTRATEGY, ObjectIdGetDatum(*opfamily), ObjectIdGetDatum(atttypid), + ObjectIdGetDatum(subtype), Int16GetDatum(strategynum)); if (!HeapTupleIsValid(tuple)) @@ -257,8 +241,6 @@ bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, Strat return false; fmgr_info_cxt(opcode, finfo ? 
finfo : &dummy, CurrentMemoryContext); - *procid = opcode; - return true; } diff --git a/contrib/pax_storage/src/cpp/comm/paxc_wrappers.h b/contrib/pax_storage/src/cpp/comm/paxc_wrappers.h index fc0315a0b22..d1f21f402b1 100644 --- a/contrib/pax_storage/src/cpp/comm/paxc_wrappers.h +++ b/contrib/pax_storage/src/cpp/comm/paxc_wrappers.h @@ -8,6 +8,5 @@ void CopyFile(const char *srcsegpath, const char *dstsegpath); void DeletePaxDirectoryPath(const char *dirname, bool delete_topleveldir); void MakedirRecursive(const char *path); char *BuildPaxDirectoryPath(RelFileNode rd_node, BackendId rd_backend); -char *BuildPaxFilePath(Relation rel, const char *block_id); -bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid *procid, FmgrInfo *finfo, StrategyNumber strategynum); +bool MinMaxGetStrategyProcinfo(Oid atttypid, Oid subtype, Oid *opfamily, FmgrInfo *finfo, StrategyNumber strategynum); } // namespace paxc diff --git a/contrib/pax_storage/src/cpp/comm/singleton.h b/contrib/pax_storage/src/cpp/comm/singleton.h index f53922f7b37..ef019b51683 100644 --- a/contrib/pax_storage/src/cpp/comm/singleton.h +++ b/contrib/pax_storage/src/cpp/comm/singleton.h @@ -3,6 +3,9 @@ #include #include #include + +#include "comm/pax_memory.h" + namespace pax { template diff --git a/contrib/pax_storage/src/cpp/contrib/cpp-stub b/contrib/pax_storage/src/cpp/contrib/cpp-stub new file mode 160000 index 00000000000..93d20c639a9 --- /dev/null +++ b/contrib/pax_storage/src/cpp/contrib/cpp-stub @@ -0,0 +1 @@ +Subproject commit 93d20c639a99fe93068692803aeb1982ea10dd6c diff --git a/contrib/pax_storage/src/cpp/contrib/googlebench b/contrib/pax_storage/src/cpp/contrib/googlebench new file mode 160000 index 00000000000..c2de5261302 --- /dev/null +++ b/contrib/pax_storage/src/cpp/contrib/googlebench @@ -0,0 +1 @@ +Subproject commit c2de5261302fa307ebe06b24c0fc30653bed5e17 diff --git a/contrib/pax_storage/src/cpp/contrib/tabulate b/contrib/pax_storage/src/cpp/contrib/tabulate new file mode 160000 index 
00000000000..59f1c648070 --- /dev/null +++ b/contrib/pax_storage/src/cpp/contrib/tabulate @@ -0,0 +1 @@ +Subproject commit 59f1c6480705bae8e83800914e6ede4fb077b435 diff --git a/contrib/pax_storage/src/cpp/contrib/zstd b/contrib/pax_storage/src/cpp/contrib/zstd deleted file mode 160000 index 1e6651126b5..00000000000 --- a/contrib/pax_storage/src/cpp/contrib/zstd +++ /dev/null @@ -1 +0,0 @@ -Subproject commit 1e6651126b5a0daf860c94d81cef019fb12283d7 diff --git a/contrib/pax_storage/src/cpp/pax_gbench.cc b/contrib/pax_storage/src/cpp/pax_gbench.cc new file mode 100644 index 00000000000..d9e72f48e26 --- /dev/null +++ b/contrib/pax_storage/src/cpp/pax_gbench.cc @@ -0,0 +1,9 @@ +#include + +static void example_benchmark(benchmark::State &state) { + for (auto _ : state) { + } +} +BENCHMARK(example_benchmark); + +BENCHMARK_MAIN(); \ No newline at end of file diff --git a/contrib/pax_storage/src/cpp/pax_gtest.cc b/contrib/pax_storage/src/cpp/pax_gtest.cc new file mode 100644 index 00000000000..6cb6c0c3a8f --- /dev/null +++ b/contrib/pax_storage/src/cpp/pax_gtest.cc @@ -0,0 +1,24 @@ +#include + +#include "stub.h" +#include "comm/gtest_wrappers.h" +#include "comm/cbdb_wrappers.h" + +bool MockMinMaxGetStrategyProcinfo(Oid, Oid, Oid *, FmgrInfo *, + StrategyNumber) { + return false; +} + +// Mock global method which is not link from another libarays +void GlobalMock(Stub *stub) { + stub->set(cbdb::MinMaxGetStrategyProcinfo, MockMinMaxGetStrategyProcinfo); +} + +int main(int argc, char **argv) { + Stub *stub_global; + stub_global = new Stub(); + testing::InitGoogleTest(&argc, argv); + GlobalMock(stub_global); + + return RUN_ALL_TESTS(); +} diff --git a/contrib/pax_storage/src/cpp/pax_gtest_helper.cc b/contrib/pax_storage/src/cpp/pax_gtest_helper.cc new file mode 100644 index 00000000000..a497986848e --- /dev/null +++ b/contrib/pax_storage/src/cpp/pax_gtest_helper.cc @@ -0,0 +1,168 @@ +#include "pax_gtest_helper.h" + +#include "storage/micro_partition.h" + +namespace pax::tests { 
+ +void GenTextBuffer(char *buffer, size_t length) { + for (size_t i = 0; i < length; i++) { + buffer[i] = static_cast(i); + } +} + +void CreateMemoryContext() { + MemoryContext test_memory_context = AllocSetContextCreate( + (MemoryContext)NULL, "TestMemoryContext", 80 * 1024 * 1024, + 80 * 1024 * 1024, 80 * 1024 * 1024); + MemoryContextSwitchTo(test_memory_context); +} + +void CreateTestResourceOwner() { + CurrentResourceOwner = ResourceOwnerCreate(NULL, "TestResourceOwner"); +} + +void ReleaseTestResourceOwner() { + ResourceOwner tmp_resource_owner = CurrentResourceOwner; + CurrentResourceOwner = NULL; + ResourceOwnerRelease(tmp_resource_owner, RESOURCE_RELEASE_BEFORE_LOCKS, false, + true); + ResourceOwnerRelease(tmp_resource_owner, RESOURCE_RELEASE_LOCKS, false, true); + ResourceOwnerRelease(tmp_resource_owner, RESOURCE_RELEASE_AFTER_LOCKS, false, + true); + ResourceOwnerDelete(tmp_resource_owner); +} + +static TupleDesc CreateTestTupleDesc() { + auto tuple_desc = reinterpret_cast(cbdb::Palloc0( + sizeof(TupleDescData) + sizeof(FormData_pg_attribute) * COLUMN_NUMS)); + + tuple_desc->natts = COLUMN_NUMS; + tuple_desc->attrs[0] = {.atttypid = TEXTOID, + .attlen = -1, + .attbyval = false, + .attalign = TYPALIGN_DOUBLE, + .attisdropped = false, + .attcollation = DEFAULT_COLLATION_OID}; + + tuple_desc->attrs[1] = {.atttypid = TEXTOID, + .attlen = -1, + .attbyval = false, + .attalign = TYPALIGN_DOUBLE, + .attisdropped = false, + .attcollation = DEFAULT_COLLATION_OID}; + + tuple_desc->attrs[2] = {.atttypid = INT4OID, + .attlen = 4, + .attbyval = true, + .attalign = TYPALIGN_INT, + .attisdropped = false, + .attcollation = InvalidOid}; + return tuple_desc; +} + +TupleTableSlot *CreateTestTupleTableSlot(bool with_value) { + TupleTableSlot *tuple_slot = nullptr; + TupleDesc tuple_desc = nullptr; + + tuple_desc = CreateTestTupleDesc(); + + tuple_slot = MakeTupleTableSlot(tuple_desc, &TTSOpsVirtual); + + if (with_value) { + char column_buff[COLUMN_SIZE * 2]; + 
GenTextBuffer(column_buff, COLUMN_SIZE); + GenTextBuffer(column_buff + COLUMN_SIZE, COLUMN_SIZE); + + tuple_slot->tts_values[0] = + cbdb::DatumFromCString(column_buff, COLUMN_SIZE); + tuple_slot->tts_values[1] = + cbdb::DatumFromCString(column_buff + COLUMN_SIZE, COLUMN_SIZE); + tuple_slot->tts_values[2] = cbdb::Int32ToDatum(INT32_COLUMN_VALUE); + tuple_slot->tts_isnull[0] = false; + tuple_slot->tts_isnull[1] = false; + tuple_slot->tts_isnull[2] = false; + } + + return tuple_slot; +} + +static bool VerifyTestNonFixed(Datum datum, bool is_null) { + struct varlena *vl, *tunpacked; + int read_len; + char *read_data; + char column_buff[COLUMN_SIZE]; + + GenTextBuffer(column_buff, COLUMN_SIZE); + + if (is_null) { + return false; + } + + vl = (struct varlena *)DatumGetPointer(datum); + tunpacked = pg_detoast_datum_packed(vl); + if ((Pointer)vl != (Pointer)tunpacked) { + return false; + } + + read_len = VARSIZE(tunpacked); + read_data = VARDATA_ANY(tunpacked); + + if (read_len != COLUMN_SIZE + VARHDRSZ) { + return false; + } + + if (std::memcmp(read_data, column_buff, COLUMN_SIZE) != 0) { + return false; + } + return true; +} + +static bool VerifyTestFixed(Datum datum, bool is_null) { + return !is_null && cbdb::DatumToInt32(datum) == INT32_COLUMN_VALUE; +} + +bool VerifyTestTupleTableSlot(TupleTableSlot *tuple_slot) { + bool ok = true; + + if (!tuple_slot) { + return false; + } + + ok &= + VerifyTestNonFixed(tuple_slot->tts_values[0], tuple_slot->tts_isnull[0]); + ok &= + VerifyTestNonFixed(tuple_slot->tts_values[1], tuple_slot->tts_isnull[1]); + ok &= VerifyTestFixed(tuple_slot->tts_values[2], tuple_slot->tts_isnull[2]); + return ok; +} + +bool VerifyTestTupleTableSlot(TupleTableSlot *tuple_slot, int attrno) { + Assert(attrno <= 3 && attrno > 0); + + if (!tuple_slot) { + return false; + } + + if (attrno <= 2) { + return VerifyTestNonFixed(tuple_slot->tts_values[attrno - 1], + tuple_slot->tts_isnull[attrno - 1]); + } else { + return 
VerifyTestFixed(tuple_slot->tts_values[attrno - 1], + tuple_slot->tts_isnull[attrno - 1]); + } +} + +void DeleteTestTupleTableSlot(TupleTableSlot *tuple_slot) { + cbdb::Pfree(tuple_slot->tts_tupleDescriptor); + cbdb::Pfree(tuple_slot); +} + +std::vector CreateTestSchemaTypes() { + std::vector types; + types.emplace_back(pax::orc::proto::Type_Kind::Type_Kind_STRING); + types.emplace_back(pax::orc::proto::Type_Kind::Type_Kind_STRING); + types.emplace_back(pax::orc::proto::Type_Kind::Type_Kind_INT); + return types; +} + +} // namespace pax::tests diff --git a/contrib/pax_storage/src/cpp/pax_gtest_helper.h b/contrib/pax_storage/src/cpp/pax_gtest_helper.h new file mode 100644 index 00000000000..b82bf97e037 --- /dev/null +++ b/contrib/pax_storage/src/cpp/pax_gtest_helper.h @@ -0,0 +1,26 @@ +#pragma once +#include "comm/cbdb_api.h" + +#include + +#include "storage/proto/proto_wrappers.h" + +namespace pax::tests { + +// 3 clomun - string(len 100), string(len 100), int(len 4) +#define COLUMN_NUMS 3 +#define COLUMN_SIZE 100 +#define INT32_COLUMN_VALUE 0x123 +#define INT32_COLUMN_VALUE_DEFAULT 0x001 + +extern void CreateMemoryContext(); +extern void CreateTestResourceOwner(); +extern void ReleaseTestResourceOwner(); +extern TupleTableSlot *CreateTestTupleTableSlot(bool with_value = true); +extern bool VerifyTestTupleTableSlot(TupleTableSlot *tuple_slot); +extern bool VerifyTestTupleTableSlot(TupleTableSlot *tuple_slot, int attrno); +extern void DeleteTestTupleTableSlot(TupleTableSlot *tuple_slot); + +extern void GenTextBuffer(char *buffer, size_t length); +extern std::vector CreateTestSchemaTypes(); +} // namespace pax::tests diff --git a/contrib/pax_storage/src/cpp/storage/cache/pax_cache.cc b/contrib/pax_storage/src/cpp/storage/cache/pax_cache.cc new file mode 100644 index 00000000000..9b135ee5a75 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/cache/pax_cache.cc @@ -0,0 +1,14 @@ +#include "storage/cache/pax_cache.h" + +namespace pax { + +bool PaxCache::Status::Ok() 
const { return ok_; } + +std::string PaxCache::Status::Error() { return error_msg_; } + +void PaxCache::Status::SetError(const std::string &error_msg) { + ok_ = false; + error_msg_ = error_msg; +} + +}; // namespace pax \ No newline at end of file diff --git a/contrib/pax_storage/src/cpp/storage/cache/pax_cache.h b/contrib/pax_storage/src/cpp/storage/cache/pax_cache.h new file mode 100644 index 00000000000..121c78342a0 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/cache/pax_cache.h @@ -0,0 +1,64 @@ +#pragma once + +#include +#include + +namespace pax { + +class PaxCache { + public: + struct Status { + friend class PaxCache; + + bool Ok() const; + + std::string Error(); + + void SetError(const std::string &error_msg); + + private: + bool ok_ = true; + std::string error_msg_; + }; + + struct BatchBuffer { + const char *buffer = nullptr; + size_t buffer_len = 0; + const char *meta = nullptr; + size_t meta_len = 0; + + bool not_exist = false; + }; + + virtual ~PaxCache() = default; + + virtual Status Initialize() = 0; + + virtual Status Put(const std::string &key, + const BatchBuffer &batch_buffer) = 0; + + virtual Status Put(const std::string &key, + const std::vector> &buffers, + const std::pair &meta) = 0; + + virtual Status Exists(const std::string &key, bool *has) = 0; + + virtual Status Get(const std::string &key, BatchBuffer &batch_buffer) = 0; + + virtual Status Get(const std::vector &keys, + std::vector &batchs) = 0; + + virtual Status Release(const std::string &key) = 0; + + virtual Status Release(const std::vector &keys) = 0; + + virtual Status Delete(const std::string &key) = 0; + + virtual Status Delete(const std::vector &key) = 0; + + virtual Status Destroy() = 0; + + virtual size_t KeySizeLimit() = 0; +}; + +} // namespace pax diff --git a/contrib/pax_storage/src/cpp/storage/cache/pax_cache_test.cc b/contrib/pax_storage/src/cpp/storage/cache/pax_cache_test.cc new file mode 100644 index 00000000000..15ac2015dbb --- /dev/null +++ 
b/contrib/pax_storage/src/cpp/storage/cache/pax_cache_test.cc @@ -0,0 +1,347 @@ +#ifdef ENABLE_PLASMA +#include "plasma/store.h" +#endif + +#include + +#include + +#include + +// #include "comm/gtest_wrappers.h" +#include "pax_gtest_helper.h" +#include "storage/cache/pax_cache.h" +#include "storage/cache/pax_plasma_cache.h" +#ifdef ENABLE_PLASMA + +namespace pax::tests { + +#define CACHE_DATA_LEN 100 +#define CACHE_META_LEN 20 + +class PaxCacheTest : public ::testing::Test { + void SetUp() override { + plasma_server_ = std::thread([this] { + plasma::StartServer( + plasma_socket_ /* socket_name */, "" /* plasma_directory */, + false /* hugepages_enabled */, nullptr /* external_store */, + 10 * 1024 * 1024 /* system_memory */, + PLASMA_INFO /* plasmaLogSeverity */); + plasma::ShutdownServer(); + }); + sleep(1); + } + + void TearDown() override { + plasma::StopServer(); + plasma_server_.join(); + } + + protected: + static void PutKey(PaxCache *pax_cache, const std::string &key, + const PaxCache::BatchBuffer &input) { + auto status = pax_cache->Put(key, input); + ASSERT_TRUE(status.Ok()) << "fail to put key: " << key << status.Error(); + } + + static void Exist(PaxCache *pax_cache, const std::string &key, bool exist) { + bool exist_rc = false; + auto status = pax_cache->Exists(key, &exist_rc); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_TRUE(exist ? 
exist_rc : !exist_rc) << "key: " << key << " exist"; + }; + + protected: + const int64_t client_memory_quota_ = 5 * 1024 * 1024; + char plasma_socket_[1024] = "/tmp/plasma"; + std::thread plasma_server_; +}; + +TEST_F(PaxCacheTest, TestCacheInterface) { + PaxCache *pax_cache; + PaxPlasmaCache::CacheOptions cache_options; + PaxCache::Status status; + PaxCache::BatchBuffer batch_buffer{0}; + + cache_options.domain_socket = std::string(plasma_socket_); + cache_options.client_name = "CLI1"; + cache_options.memory_quota = client_memory_quota_; + cache_options.waitting_ms = 0; + + pax_cache = new PaxPlasmaCache(cache_options); + status = pax_cache->Initialize(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + // create 3 key + char data[CACHE_DATA_LEN]; + char meta[CACHE_META_LEN]; + GenTextBuffer(data, CACHE_DATA_LEN); + GenTextBuffer(meta, CACHE_META_LEN); + + batch_buffer.buffer = data; + batch_buffer.buffer_len = CACHE_DATA_LEN; + batch_buffer.meta = nullptr; + batch_buffer.meta = 0; + + PutKey(pax_cache, "key1", batch_buffer); + batch_buffer.meta = meta; + batch_buffer.meta_len = CACHE_META_LEN; + + PutKey(pax_cache, "key2", batch_buffer); + PutKey(pax_cache, "key3", batch_buffer); + + Exist(pax_cache, "key1", true); + Exist(pax_cache, "key2", true); + Exist(pax_cache, "key3", true); + + batch_buffer.buffer = nullptr; + batch_buffer.buffer_len = 0; + batch_buffer.meta = nullptr; + batch_buffer.meta_len = 0; + + // get + release + status = pax_cache->Get("key1", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + EXPECT_EQ(CACHE_DATA_LEN, batch_buffer.buffer_len); + EXPECT_EQ(0, batch_buffer.meta_len); + EXPECT_EQ(0, std::memcmp(batch_buffer.buffer, data, CACHE_DATA_LEN)); + // still will alloc a meta address with size 0 + EXPECT_NE(nullptr, batch_buffer.meta); + + status = pax_cache->Get("key2", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + EXPECT_EQ(CACHE_DATA_LEN, batch_buffer.buffer_len); + EXPECT_EQ(CACHE_META_LEN, 
batch_buffer.meta_len); + EXPECT_EQ(0, std::memcmp(batch_buffer.buffer, data, CACHE_DATA_LEN)); + EXPECT_EQ(0, std::memcmp(batch_buffer.meta, meta, CACHE_META_LEN)); + + status = pax_cache->Get("key3", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Release("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + std::vector release_list = {"key2", "key3"}; + status = pax_cache->Release(release_list); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Delete("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + std::vector delete_list = {"key2", "key3"}; + status = pax_cache->Delete(delete_list); + ASSERT_TRUE(status.Ok()) << status.Error(); + + Exist(pax_cache, "key1", false); + Exist(pax_cache, "key2", false); + Exist(pax_cache, "key3", false); + + status = pax_cache->Destroy(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + delete pax_cache; +} + +TEST_F(PaxCacheTest, TestLRUReplace) { + PaxCache *pax_cache; + PaxPlasmaCache::CacheOptions cache_options; + PaxCache::Status status; + PaxCache::BatchBuffer batch_buffer{0}; + + cache_options.domain_socket = std::string(plasma_socket_); + cache_options.client_name = "CLI1"; + cache_options.memory_quota = CACHE_DATA_LEN * 3; + cache_options.waitting_ms = 0; + + pax_cache = new PaxPlasmaCache(cache_options); + status = pax_cache->Initialize(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + char data[CACHE_DATA_LEN]; + GenTextBuffer(data, CACHE_DATA_LEN); + + batch_buffer.buffer = data; + batch_buffer.buffer_len = CACHE_DATA_LEN; + batch_buffer.meta = nullptr; + batch_buffer.meta_len = 0; + + PutKey(pax_cache, "key1", batch_buffer); + PutKey(pax_cache, "key2", batch_buffer); + PutKey(pax_cache, "key3", batch_buffer); + PutKey(pax_cache, "key4", batch_buffer); + PutKey(pax_cache, "key5", batch_buffer); + + status = pax_cache->Get("key1", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_TRUE(batch_buffer.not_exist); + + status = 
pax_cache->Get("key2", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_TRUE(batch_buffer.not_exist); + + status = pax_cache->Get("key3", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_FALSE(batch_buffer.not_exist); + + status = pax_cache->Release("key3"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Delete("key3"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Get("key4", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_FALSE(batch_buffer.not_exist); + + status = pax_cache->Release("key4"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Delete("key4"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Get("key5", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_FALSE(batch_buffer.not_exist); + + status = pax_cache->Release("key5"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Delete("key5"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Destroy(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + delete pax_cache; +} + +TEST_F(PaxCacheTest, TestGetNoExist) { + PaxCache *pax_cache; + PaxPlasmaCache::CacheOptions cache_options; + PaxCache::Status status; + PaxCache::BatchBuffer batch_buffer{0}; + + cache_options.domain_socket = std::string(plasma_socket_); + cache_options.client_name = "CLI1"; + cache_options.memory_quota = client_memory_quota_; + cache_options.waitting_ms = 0; + + pax_cache = new PaxPlasmaCache(cache_options); + status = pax_cache->Initialize(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + char data[CACHE_DATA_LEN]; + char meta[CACHE_META_LEN]; + GenTextBuffer(data, CACHE_DATA_LEN); + GenTextBuffer(meta, CACHE_META_LEN); + + batch_buffer.buffer = data; + batch_buffer.buffer_len = CACHE_DATA_LEN; + batch_buffer.meta = meta; + batch_buffer.meta_len = CACHE_META_LEN; + + PutKey(pax_cache, "key1", batch_buffer); + 
Exist(pax_cache, "key1", true); + + status = pax_cache->Get("key1", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Release("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Get("abc", batch_buffer); + ASSERT_TRUE(status.Ok()); + ASSERT_TRUE(batch_buffer.not_exist); + + std::vector batch_buffers; + status = pax_cache->Get({"key1", "abc"}, batch_buffers); + ASSERT_TRUE(status.Ok()) << status.Error(); + ASSERT_FALSE(batch_buffers[0].not_exist); + ASSERT_TRUE(batch_buffers[1].not_exist); + + status = pax_cache->Release("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Delete("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + status = pax_cache->Destroy(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + delete pax_cache; +} + +TEST_F(PaxCacheTest, TestDifferentClientDelete) { + PaxCache *pax_cache; + PaxPlasmaCache::CacheOptions cache_options; + PaxCache::Status status; + PaxCache::BatchBuffer batch_buffer{0}; + + cache_options.domain_socket = std::string(plasma_socket_); + cache_options.client_name = "CLI1"; + cache_options.memory_quota = client_memory_quota_; + cache_options.waitting_ms = 0; + + pax_cache = new PaxPlasmaCache(cache_options); + status = pax_cache->Initialize(); + ASSERT_TRUE(status.Ok()) << status.Error(); + + char data[CACHE_DATA_LEN]; + char meta[CACHE_META_LEN]; + GenTextBuffer(data, CACHE_DATA_LEN); + GenTextBuffer(meta, CACHE_META_LEN); + + batch_buffer.buffer = data; + batch_buffer.buffer_len = CACHE_DATA_LEN; + batch_buffer.meta = meta; + batch_buffer.meta_len = CACHE_META_LEN; + + PutKey(pax_cache, "key1", batch_buffer); + Exist(pax_cache, "key1", true); + + // CLI1 destroy + status = pax_cache->Destroy(); + ASSERT_TRUE(status.Ok()) << status.Error(); + delete pax_cache; + + // create CLI2 + cache_options.client_name = "CLI2"; + pax_cache = new PaxPlasmaCache(cache_options); + + status = pax_cache->Initialize(); + ASSERT_TRUE(status.Ok()) 
<< status.Error(); + + // check exist + Exist(pax_cache, "key1", true); + + // get key1 + batch_buffer.buffer = nullptr; + batch_buffer.buffer_len = 0; + batch_buffer.meta = nullptr; + batch_buffer.meta_len = 0; + + status = pax_cache->Get("key1", batch_buffer); + ASSERT_TRUE(status.Ok()) << status.Error(); + EXPECT_EQ(CACHE_DATA_LEN, batch_buffer.buffer_len); + EXPECT_EQ(CACHE_META_LEN, batch_buffer.meta_len); + EXPECT_EQ(0, std::memcmp(batch_buffer.buffer, data, CACHE_DATA_LEN)); + EXPECT_EQ(0, std::memcmp(batch_buffer.meta, meta, CACHE_META_LEN)); + + status = pax_cache->Release("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + // delete key1 + status = pax_cache->Delete("key1"); + ASSERT_TRUE(status.Ok()) << status.Error(); + + // should delete success + Exist(pax_cache, "key1", false); + + status = pax_cache->Destroy(); + ASSERT_TRUE(status.Ok()) << status.Error(); + delete pax_cache; +} + +} // namespace pax::tests + +#endif // ENABLE_PLASMA diff --git a/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.cc b/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.cc new file mode 100644 index 00000000000..2d9e941a1d2 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.cc @@ -0,0 +1,276 @@ +#include "storage/cache/pax_plasma_cache.h" + +#ifdef ENABLE_PLASMA +#include +#include +#endif // ENABLE_PLASMA + +#include + +#include "comm/cbdb_wrappers.h" + +#ifdef ENABLE_PLASMA + +namespace pax { + +static inline plasma::ObjectID KeyToPlasmaId(const std::string &key, + size_t key_size_limit) { + plasma::ObjectID key_id; + + Assert(key.length() <= key_size_limit); + memcpy(key_id.mutable_data(), key.c_str(), key.length()); + memset(key_id.mutable_data() + key.length(), 0, + key_size_limit - key.length()); + + return key_id; +} + +static inline std::string PlasmaIdToKey(const plasma::ObjectID &key_id) { + std::string key; + key = key_id.binary(); + return key; +} + +PaxPlasmaCache::PaxPlasmaCache(const CacheOptions 
&option) + : PaxCache(), + options_(option), + is_initialized_(false), + plasma_client_(PAX_NEW()) {} + +PaxPlasmaCache::~PaxPlasmaCache() { PAX_DELETE(plasma_client_); }; + +PaxCache::Status PaxPlasmaCache::Initialize() { + PaxCache::Status status; + if (is_initialized_) { + status.SetError("Don't initialize twice."); + return status; + } + + auto plasma_status = plasma_client_->Connect( + options_.domain_socket /*store_socket_name*/, "" /*manager_socket_name*/, + 0 /*release_delay*/, 3 /*num_retries*/); + CHECK_PLASMA_STATUS(plasma_status, status); + + if (options_.memory_quota != 0) { + plasma_status = plasma_client_->SetClientOptions(options_.client_name, + options_.memory_quota); + CHECK_PLASMA_STATUS(plasma_status, status); + } + + is_initialized_ = true; + return status; +} + +PaxCache::Status PaxPlasmaCache::Put(const std::string &key, + const BatchBuffer &batch_buffer) { + PaxCache::Status status; + plasma::ObjectID key_id; + std::shared_ptr plasma_buffer; + + assert(is_initialized_); + assert(key.length() <= KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + + plasma::Status plasma_status = plasma_client_->Create( + key_id, batch_buffer.buffer_len, (const uint8_t *)batch_buffer.meta, + batch_buffer.meta_len, &plasma_buffer); + CHECK_PLASMA_STATUS(plasma_status, status); + + assert((size_t)plasma_buffer->size() == batch_buffer.buffer_len); + + memcpy(plasma_buffer->mutable_data(), batch_buffer.buffer, + batch_buffer.buffer_len); + + plasma_status = plasma_client_->Seal(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + + plasma_status = plasma_client_->Release(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + + return status; +} + +PaxCache::Status PaxPlasmaCache::Put( + const std::string &key, + const std::vector> &buffers, + const std::pair &meta) { + PaxCache::Status status; + plasma::ObjectID key_id; + std::shared_ptr plasma_buffer; + size_t total_size = 0; + size_t data_offset = 0; + + assert(is_initialized_); + 
assert(key.length() <= KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + + for (auto &pair : buffers) { + total_size += pair.second; + } + + plasma::Status plasma_status = + plasma_client_->Create(key_id, total_size, (const uint8_t *)meta.first, + meta.second, &plasma_buffer); + CHECK_PLASMA_STATUS(plasma_status, status); + + assert((size_t)plasma_buffer->size() == total_size); + + for (auto &pair : buffers) { + memcpy(plasma_buffer->mutable_data() + data_offset, pair.first, + pair.second); + data_offset += pair.second; + } + Assert(data_offset == total_size); + + plasma_status = plasma_client_->Seal(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + + plasma_status = plasma_client_->Release(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + return status; +} + +PaxCache::Status PaxPlasmaCache::Exists(const std::string &key, bool *has) { + PaxCache::Status status; + plasma::ObjectID key_id; + + assert(is_initialized_); + assert(key.length() <= KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + + plasma::Status plasma_status = plasma_client_->Contains(key_id, has); + CHECK_PLASMA_STATUS(plasma_status, status); + + return status; +} + +PaxCache::Status PaxPlasmaCache::Get(const std::string &key, + BatchBuffer &batch_buffer) { + PaxCache::Status status; + plasma::ObjectID key_id; + plasma::ObjectBuffer obj_buffer; + + assert(is_initialized_); + assert(key.length() <= KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + auto plasma_status = + plasma_client_->Get(&key_id, 1, options_.waitting_ms, &obj_buffer); + CHECK_PLASMA_STATUS(plasma_status, status); + + if (!obj_buffer.data) { + // not exist in server + batch_buffer.not_exist = true; + return status; + } + + batch_buffer.buffer = (const char *)obj_buffer.data->data(); + batch_buffer.buffer_len = obj_buffer.data->size(); + batch_buffer.meta = (const char *)obj_buffer.metadata->data(); + batch_buffer.meta_len = obj_buffer.metadata->size(); + 
batch_buffer.not_exist = false; + + return status; +} + +PaxCache::Status PaxPlasmaCache::Get(const std::vector &keys, + std::vector &batchs) { + PaxCache::Status status; + plasma::ObjectID key_ids[keys.size()]; + plasma::ObjectBuffer obj_buffers[keys.size()]; + + assert(is_initialized_); + + for (size_t i = 0; i < keys.size(); i++) { + assert(keys[i].length() <= KeySizeLimit()); + key_ids[i] = KeyToPlasmaId(keys[i], KeySizeLimit()); + } + + auto plasma_status = plasma_client_->Get(key_ids, keys.size(), + options_.waitting_ms, obj_buffers); + CHECK_PLASMA_STATUS(plasma_status, status); + + for (size_t i = 0; i < keys.size(); i++) { + BatchBuffer batch_buffer; + if (!obj_buffers[i].data) { + batch_buffer.not_exist = true; + } else { + batch_buffer.not_exist = false; + batch_buffer.buffer = (const char *)obj_buffers[i].data->data(); + batch_buffer.buffer_len = obj_buffers[i].data->size(); + batch_buffer.meta = (const char *)obj_buffers[i].metadata->data(); + batch_buffer.meta_len = obj_buffers[i].metadata->size(); + } + batchs.emplace_back(batch_buffer); + } + + return status; +} + +PaxCache::Status PaxPlasmaCache::Release(const std::string &key) { + PaxCache::Status status; + plasma::ObjectID key_id; + + assert(is_initialized_); + assert(key.length() <= KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + auto plasma_status = plasma_client_->Release(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + return status; +} + +PaxCache::Status PaxPlasmaCache::Release(const std::vector &keys) { + PaxCache::Status status; + plasma::ObjectID key_id; + + assert(is_initialized_); + for (const auto &key : keys) { + key_id = KeyToPlasmaId(key, KeySizeLimit()); + auto plasma_status = plasma_client_->Release(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + } + return status; +} + +PaxCache::Status PaxPlasmaCache::Delete(const std::string &key) { + PaxCache::Status status; + plasma::ObjectID key_id; + + assert(is_initialized_); + assert(key.length() <= 
KeySizeLimit()); + key_id = KeyToPlasmaId(key, KeySizeLimit()); + plasma::Status plasma_status = plasma_client_->Delete(key_id); + CHECK_PLASMA_STATUS(plasma_status, status); + + return status; +} + +PaxCache::Status PaxPlasmaCache::Delete(const std::vector &keys) { + PaxCache::Status status; + std::vector key_ids; + std::vector obj_buffers; + + assert(is_initialized_); + for (const auto &key : keys) { + key_ids.emplace_back(KeyToPlasmaId(key, KeySizeLimit())); + } + + plasma::Status plasma_status = plasma_client_->Delete(key_ids); + CHECK_PLASMA_STATUS(plasma_status, status); + + return status; +} + +PaxCache::Status PaxPlasmaCache::Destroy() { + PaxCache::Status status; + plasma::Status plasma_status = plasma_client_->Disconnect(); + assert(is_initialized_); + is_initialized_ = false; + CHECK_PLASMA_STATUS(plasma_status, status); + return status; +} + +size_t PaxPlasmaCache::KeySizeLimit() { return plasma::kUniqueIDSize; } + +} // namespace pax + +#endif // ENABLE_PLASMA diff --git a/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.h b/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.h new file mode 100644 index 00000000000..ab3555a4461 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/cache/pax_plasma_cache.h @@ -0,0 +1,82 @@ +#pragma once + +#ifdef ENABLE_PLASMA + +#include +#include + +#include "storage/cache/pax_cache.h" + +namespace plasma { +class PlasmaClient; +} + +namespace pax { + +#define CHECK_PLASMA_STATUS(plasma_status, status_rc) \ + do { \ + if (!(plasma_status).ok()) { \ + (status_rc).SetError((plasma_status).ToString()); \ + return (status_rc); \ + } \ + } while (0); + +class PaxPlasmaCache : public PaxCache { + public: + struct CacheOptions { + std::string domain_socket; + // client name + memory quota will limit current client memory used + // if memory_quota_ is 0 means no limit + // Notice that: if current plasma server capcity LT memory quota + // Then it will make Initialize failed + std::string client_name; + 
size_t memory_quota = 0; + + // the waitting time after `Get` call failed + // during this period, if the same `key` is put, + // the data will be obtained + size_t waitting_ms = 0; + }; + + explicit PaxPlasmaCache(const CacheOptions &option); + + ~PaxPlasmaCache() override; + + PaxCache::Status Initialize() override; + + PaxCache::Status Put(const std::string &key, + const BatchBuffer &batch_buffer) override; + + PaxCache::Status Put(const std::string &key, + const std::vector> &buffers, + const std::pair &meta) override; + + PaxCache::Status Exists(const std::string &key, bool *has) override; + + PaxCache::Status Get(const std::string &key, + BatchBuffer &batch_buffer) override; + + PaxCache::Status Get(const std::vector &keys, + std::vector &batchs) override; + + PaxCache::Status Release(const std::string &key) override; + + PaxCache::Status Release(const std::vector &keys) override; + + PaxCache::Status Delete(const std::string &key) override; + + PaxCache::Status Delete(const std::vector &keys) override; + + PaxCache::Status Destroy() override; + + size_t KeySizeLimit() override; + + private: + CacheOptions options_; + bool is_initialized_; + plasma::PlasmaClient *plasma_client_; +}; + +} // namespace pax + +#endif // ENABLE_PLASMA diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column.cc b/contrib/pax_storage/src/cpp/storage/columns/pax_column.cc index 04eba6feb42..2ad0a7bfa57 100644 --- a/contrib/pax_storage/src/cpp/storage/columns/pax_column.cc +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column.cc @@ -6,125 +6,87 @@ #include #include -#include "comm/pax_defer.h" +#include "storage/columns/pax_column_traits.h" +#include "storage/pax_defined.h" namespace pax { PaxColumn::PaxColumn() : null_bitmap_(nullptr), + total_rows_(0), + non_null_rows_(0), encoded_type_(ColumnEncoding_Kind::ColumnEncoding_Kind_NO_ENCODED), - storage_type_(PaxColumnStorageType::kTypeStorageNonVec) {} + compress_level_(0), + type_align_size_(PAX_DATA_NO_ALIGN) {} 
-PaxColumn::~PaxColumn() { - if (null_bitmap_) { - delete null_bitmap_; - } -} +PaxColumn::~PaxColumn() { PAX_DELETE(null_bitmap_); } PaxColumnTypeInMem PaxColumn::GetPaxColumnTypeInMem() const { return PaxColumnTypeInMem::kTypeInvalid; } -void PaxColumn::Clear() { - if (null_bitmap_) { - delete null_bitmap_; - null_bitmap_ = nullptr; - } -} - bool PaxColumn::HasNull() { return null_bitmap_ != nullptr; } -void PaxColumn::SetNulls(DataBuffer *null_bitmap) { +bool PaxColumn::AllNull() const { + return null_bitmap_ && null_bitmap_->Empty(); +} + +void PaxColumn::SetBitmap(Bitmap8 *null_bitmap) { Assert(!null_bitmap_); null_bitmap_ = null_bitmap; } -DataBuffer *PaxColumn::GetNulls() const { return null_bitmap_; } - -std::pair PaxColumn::GetRangeNulls(size_t start_pos, - size_t len) { - Assert(null_bitmap_); - CBDB_CHECK((start_pos + len) <= GetRows(), - cbdb::CException::ExType::kExTypeOutOfRange); +size_t PaxColumn::GetRows() const { return total_rows_; } - static_assert(sizeof(char) == sizeof(bool)); - return std::make_pair(null_bitmap_->GetBuffer() + start_pos, len); -} +size_t PaxColumn::GetNonNullRows() const { return non_null_rows_; } -size_t PaxColumn::GetRows() { - return null_bitmap_ ? 
null_bitmap_->Used() : GetNonNullRows(); -} +void PaxColumn::SetRows(size_t total_rows) { total_rows_ = total_rows; } size_t PaxColumn::GetRangeNonNullRows(size_t start_pos, size_t len) { CBDB_CHECK((start_pos + len) <= GetRows(), cbdb::CException::ExType::kExTypeOutOfRange); - if (null_bitmap_) { - size_t total_non_null = 0; - for (size_t i = start_pos; i < (start_pos + len); i++) { - if ((*null_bitmap_)[i]) { - total_non_null++; - } - } - - return total_non_null; - } else { - return len; + if (!null_bitmap_) return len; + if (len == 0) { + return 0; } + return null_bitmap_->CountBits(start_pos, start_pos + len - 1); +} + +void PaxColumn::CreateNulls(size_t cap) { + Assert(!null_bitmap_); + null_bitmap_ = PAX_NEW(cap); + null_bitmap_->SetN(total_rows_); } void PaxColumn::AppendNull() { if (!null_bitmap_) { - size_t current_rows = GetNonNullRows(); - size_t size = current_rows > DEFAULT_CAPACITY - ? (current_rows / DEFAULT_CAPACITY + 1) * DEFAULT_CAPACITY - : DEFAULT_CAPACITY; - null_bitmap_ = new DataBuffer(size); - null_bitmap_->Brush(current_rows * sizeof(bool)); - memset(null_bitmap_->GetBuffer(), 1, null_bitmap_->Capacity()); + CreateNulls(DEFAULT_CAPACITY); } - - if (null_bitmap_->Available() == 0) { - size_t old_cap = null_bitmap_->Capacity(); - null_bitmap_->ReSize(old_cap * 2); - memset(null_bitmap_->GetAvailableBuffer(), 1, old_cap); - } - - null_bitmap_->Write(false); - null_bitmap_->Brush(sizeof(bool)); + null_bitmap_->Clear(total_rows_); + ++total_rows_; } -void PaxColumn::Append([[maybe_unused]] char *buffer, - [[maybe_unused]] size_t size) { - if (null_bitmap_) { - if (null_bitmap_->Available() == 0) { - size_t old_cap = null_bitmap_->Capacity(); - null_bitmap_->ReSize(old_cap * 2); - memset(null_bitmap_->GetAvailableBuffer(), 1, old_cap); - } - null_bitmap_->Brush(sizeof(bool)); - } +void PaxColumn::Append(char * /*buffer*/, size_t /*size*/) { + if (null_bitmap_) null_bitmap_->Set(total_rows_); + ++total_rows_; + ++non_null_rows_; } -PaxColumn 
*PaxColumn::SetColumnEncodeType(ColumnEncoding_Kind encoding_type) { - encoded_type_ = encoding_type; - return this; -} +size_t PaxColumn::GetAlignSize() const { return type_align_size_; } -PaxColumn *PaxColumn::SetColumnStorageType(PaxColumnStorageType storage_type) { - storage_type_ = storage_type; - return this; +void PaxColumn::SetAlignSize(size_t align_size) { + Assert(align_size > 0 && (align_size & (align_size - 1)) == 0); + type_align_size_ = align_size; } -ColumnEncoding_Kind PaxColumn::GetEncodingType() const { return encoded_type_; } - template -PaxCommColumn::PaxCommColumn(uint64 capacity) : capacity_(capacity) { - data_ = new DataBuffer(capacity * sizeof(T)); +PaxCommColumn::PaxCommColumn(uint32 capacity) { + data_ = PAX_NEW>(capacity * sizeof(T)); } template PaxCommColumn::~PaxCommColumn() { - delete data_; + PAX_DELETE(data_); } template // NOLINT: redirect constructor @@ -132,7 +94,7 @@ PaxCommColumn::PaxCommColumn() : PaxCommColumn(DEFAULT_CAPACITY) {} template void PaxCommColumn::Set(DataBuffer *data) { - delete data_; + PAX_DELETE(data_); data_ = data; } @@ -145,10 +107,10 @@ void PaxCommColumn::Append(char *buffer, size_t size) { // TODO(jiaqizho): Is it necessary to support multiple buffer insertions for // bulk insert push to mirco partition? 
Assert(size == sizeof(T)); - Assert(GetNonNullRows() <= capacity_); + Assert(data_->Capacity() >= sizeof(T)); - if (GetNonNullRows() == capacity_) { - ReSize(capacity_ * 2); + if (data_->Available() == 0) { + data_->ReSize(data_->Used() + size, 2); } data_->Write(buffer_t, sizeof(T)); @@ -156,22 +118,13 @@ void PaxCommColumn::Append(char *buffer, size_t size) { } template -PaxColumnTypeInMem PaxCommColumn::GetPaxColumnTypeInMem() const { - return PaxColumnTypeInMem::kTypeFixed; -} - -template -void PaxCommColumn::Clear() { - PaxColumn::Clear(); - data_->BrushBackAll(); +PaxStorageFormat PaxCommColumn::GetStorageFormat() const { + return PaxStorageFormat::kTypeStorageOrcNonVec; } template -void PaxCommColumn::ReSize(uint64 cap) { - if (capacity_ < cap) { - data_->ReSize(cap * sizeof(T)); - capacity_ = cap; - } +PaxColumnTypeInMem PaxCommColumn::GetPaxColumnTypeInMem() const { + return PaxColumnTypeInMem::kTypeFixed; } template @@ -223,36 +176,30 @@ template class PaxCommColumn; template class PaxCommColumn; template class PaxCommColumn; -PaxNonFixedColumn::PaxNonFixedColumn(uint64 capacity) : estimated_size_(0) { - data_ = new DataBuffer(capacity * sizeof(char) * 100); - lengths_ = new DataBuffer(capacity * sizeof(char)); +PaxNonFixedColumn::PaxNonFixedColumn(uint32 capacity) : estimated_size_(0) { + data_ = PAX_NEW>(capacity * sizeof(char)); + lengths_ = PAX_NEW>(capacity * sizeof(char)); } PaxNonFixedColumn::PaxNonFixedColumn() : PaxNonFixedColumn(DEFAULT_CAPACITY) {} PaxNonFixedColumn::~PaxNonFixedColumn() { - if (data_) { - delete data_; - } - - if (lengths_) { - delete lengths_; - } + PAX_DELETE(data_); + PAX_DELETE(lengths_); } -void PaxNonFixedColumn::Set(DataBuffer *data, DataBuffer *lengths, +void PaxNonFixedColumn::Set(DataBuffer *data, DataBuffer *lengths, size_t total_size) { - if (data_) { - delete data_; - } - - if (lengths_) { - delete lengths_; - } + PAX_DELETE(data_); + PAX_DELETE(lengths_); estimated_size_ = total_size; data_ = data; lengths_ = 
lengths; + BuildOffsets(); +} + +void PaxNonFixedColumn::BuildOffsets() { offsets_.clear(); for (size_t i = 0; i < lengths_->GetSize(); i++) { offsets_.emplace_back(i == 0 ? 0 : offsets_[i - 1] + (*lengths_)[i - 1]); @@ -260,30 +207,30 @@ void PaxNonFixedColumn::Set(DataBuffer *data, DataBuffer *lengths, } void PaxNonFixedColumn::Append(char *buffer, size_t size) { - Assert(likely(reinterpret_cast MAXALIGN(data_->Position()) == - data_->Position())); - size_t origin_size; origin_size = size; - // FIMXE(gongxun): maybe it should be aligned base on the typalign? - size = MAXALIGN(size); + if (!COLUMN_STORAGE_FORMAT_IS_VEC(this)) { + Assert(likely(reinterpret_cast MAXALIGN(data_->Position()) == + data_->Position())); + size = MAXALIGN(size); + } PaxColumn::Append(buffer, origin_size); - while (data_->Available() < size) { - data_->ReSize(data_->Capacity() * 2); + if (data_->Available() < size) { + data_->ReSize(data_->Used() + size, 2); } if (lengths_->Available() == 0) { - lengths_->ReSize(lengths_->Capacity() * 2); + lengths_->ReSize(lengths_->Used() + sizeof(int32), 2); } estimated_size_ += size; data_->Write(buffer, origin_size); data_->Brush(size); - lengths_->Write(reinterpret_cast(&size), sizeof(int64)); - lengths_->Brush(sizeof(int64)); + lengths_->Write(reinterpret_cast(&size), sizeof(int32)); + lengths_->Brush(sizeof(int32)); offsets_.emplace_back(offsets_.empty() ? 
0 @@ -292,7 +239,7 @@ void PaxNonFixedColumn::Append(char *buffer, size_t size) { Assert(offsets_.size() == lengths_->GetSize()); } -DataBuffer *PaxNonFixedColumn::GetLengthBuffer() const { +DataBuffer *PaxNonFixedColumn::GetLengthBuffer() const { return lengths_; } @@ -300,13 +247,8 @@ PaxColumnTypeInMem PaxNonFixedColumn::GetPaxColumnTypeInMem() const { return PaxColumnTypeInMem::kTypeNonFixed; } -void PaxNonFixedColumn::Clear() { - PaxColumn::Clear(); - - data_->BrushBackAll(); - lengths_->BrushBackAll(); - - offsets_.clear(); +PaxStorageFormat PaxNonFixedColumn::GetStorageFormat() const { + return PaxStorageFormat::kTypeStorageOrcNonVec; } std::pair PaxNonFixedColumn::GetBuffer() { @@ -350,14 +292,4 @@ std::pair PaxNonFixedColumn::GetRangeBuffer(size_t start_pos, return std::make_pair(data_->GetBuffer() + offsets_[start_pos], range_len); } -bool PaxNonFixedColumn::IsMemTakeOver() const { - Assert(data_->IsMemTakeOver() == lengths_->IsMemTakeOver()); - return data_->IsMemTakeOver(); -} - -void PaxNonFixedColumn::SetMemTakeOver(bool take_over) { - data_->SetMemTakeOver(take_over); - lengths_->SetMemTakeOver(take_over); -} - }; // namespace pax diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column.h b/contrib/pax_storage/src/cpp/storage/columns/pax_column.h index f6de8f4f567..69592fa8876 100644 --- a/contrib/pax_storage/src/cpp/storage/columns/pax_column.h +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column.h @@ -8,9 +8,13 @@ #include #include +#include "comm/bitmap.h" #include "storage/columns/pax_compress.h" +#include "storage/columns/pax_decoding.h" +#include "storage/columns/pax_encoding.h" #include "storage/columns/pax_encoding_utils.h" #include "storage/pax_buffer.h" +#include "storage/pax_defined.h" #include "storage/proto/proto_wrappers.h" namespace pax { @@ -21,47 +25,115 @@ namespace pax { // Used to mapping pg_type enum PaxColumnTypeInMem { kTypeInvalid = 1, kTypeFixed = 2, kTypeNonFixed = 3 }; -enum PaxColumnStorageType { - // 
default non-vec store - // which split null field and null bitmap - kTypeStorageNonVec, - // vec storage format - // spec the storage format - kTypeStorageVec, -}; - class PaxColumn { public: PaxColumn(); virtual ~PaxColumn(); - virtual PaxColumn *SetColumnEncodeType(ColumnEncoding_Kind encoding_type); - - virtual PaxColumn *SetColumnStorageType(PaxColumnStorageType storage_type); - // Get the column in memory type virtual PaxColumnTypeInMem GetPaxColumnTypeInMem() const; - // Empties the vector from all its elements, recursively. - // Do not alter the current capacity. - virtual void Clear(); - // Get column buffer from current column virtual std::pair GetBuffer() = 0; - // Get buffer by position + // The interface `GetBuffer(size_t position)` and + // `GetRangeBuffer(size_t start_pos, size_t len)` + // will return the different values in different + // `ColumnStorageType` + `ColumnTypeInMem` + // + // Also they should NEVER call in write path with encoding option!!! + // But without encoding option, still can direct call it. + // + // If `storage_type_` is kTypeStorageOrcVec + // Then data part contains `null field` which means no need use + // `row index - null counts` to get the data. + // + // But If `storage_type_` is not kTypeStorageOrcVec + // Then position should be `row index - null counts`, because + // data part will not contains `null field`. + // + // Also it is kind different in fixed-length column and non-fixed-length + // column when `storage_type_` is kTypeStorageOrcVec. For the fixed-length + // column, If we got a `null field`, then it will return the buffer with zero + // fill. But in non-fixed-length column, once we got `null field`, the buffer + // will be nullptr. 
+ // + // A example to explain: + // std::tuple GetBufferWithNull( + // size_t row_index, + // size_t null_counts) { + // + // PaxColumn *column = source(); + // char * buffer = nullptr; + // size_t length = 0; + // switch (GetPaxColumnTypeInMem()) { + // case kTypeFixed: { + // if (COLUMN_STORAGE_FORMAT_IS_VEC(column)) { + // std::tie(buffer, length) = column->GetBuffer(row_index); + // assert(buffer); // different return in different ColumnTypeInMem + // if (!length) { + // return {nullptr, 0, true}; + // } + // } else { + // std::tie(buffer, length) = column->GetBuffer( + // row_index - null_counts); + // } + // assert(buffer && length); + // return {buffer, length, false}; + // } + // case kTypeNonFixed: { + // if (COLUMN_STORAGE_FORMAT_IS_VEC(column)) { + // std::tie(buffer, length) = column->GetBuffer(row_index); + // // different return in different ColumnTypeInMem + // assert((!buffer && !length) || (buffer && length)); + // if (!buffer && !length) { + // return {nullptr, 0, true}; + // } + // } else { + // std::tie(buffer, length) = column->GetBuffer( + // row_index - null_counts); + // } + // return {buffer, length, false}; + // break; + // } + // default: + // // nothing + // } + // // should not react here! 
+ // assert(false); + // } + // + // A simplest example: + // std::tuple GetBufferWithNull(size_t row_index, + // size_t null_counts) { + // PaxColumn *column = source(); + // char * buffer = nullptr; + // size_t length = 0; + // if (COLUMN_STORAGE_FORMAT_IS_VEC(column)) { + // std::tie(buffer, length) = column->GetBuffer(row_index); + // if (!length) { + // return {nullptr, 0, true}; + // } + // } else { + // std::tie(buffer, length) = column->GetBuffer(row_index - null_counts); + // } + // assert(buffer && length); + // return {buffer, length, false}; + // } + // virtual std::pair GetBuffer(size_t position) = 0; // Get buffer by range [start_pos, start_pos + len) + // Should never call in write path with encoding option virtual std::pair GetRangeBuffer(size_t start_pos, size_t len) = 0; // Get all rows number(contain null) from column - virtual size_t GetRows(); + virtual size_t GetRows() const; // Get rows number(not null) from column - virtual size_t GetNonNullRows() const = 0; + virtual size_t GetNonNullRows() const; // Get all rows number(not null) from column by range [start_pos, start_pos + // len) @@ -76,36 +148,86 @@ class PaxColumn { // Estimated memory size from current column virtual size_t PhysicalSize() const = 0; - // Get current encoding type - virtual ColumnEncoding_Kind GetEncodingType() const; + // Get current storage type + virtual PaxStorageFormat GetStorageFormat() const = 0; // Get the data size without encoding/compress virtual int64 GetOriginLength() const = 0; - // Get the type length, if non-fixed, will return -1 + // Get the type length, used to identify sub-class + // - `PaxCommColumn` will return the length + // - `PaxNonFixedColumn` will return -1 virtual int32 GetTypeLength() const = 0; // Contain null filed or not bool HasNull(); + // Are all values null? 
+ bool AllNull() const; + // Set null bitmap - void SetNulls(DataBuffer *null_bitmap); + void SetBitmap(Bitmap8 *null_bitmap); + + // Get Bitmap + Bitmap8 *GetBitmap() { return null_bitmap_; } + + void SetRows(size_t total_rows); + + virtual size_t GetAlignSize() const; + + virtual void SetAlignSize(size_t align_size); + + // Get current encoding type + inline ColumnEncoding_Kind GetEncodingType() const { return encoded_type_; } + + // Get current compress level + inline int GetCompressLevel() const { return compress_level_; } + + protected: + // The encoding option should pass in sub-class + inline void SetEncodeType(ColumnEncoding_Kind encoding_type) { + encoded_type_ = encoding_type; + } - // Get null bitmaps - DataBuffer *GetNulls() const; + inline void SetCompressLevel(int compress_level) { + compress_level_ = compress_level; + } - // Get bull bitmaps by range [start_pos, start_pos + len) - std::pair GetRangeNulls(size_t start_pos, size_t len); + private: + void CreateNulls(size_t cap); protected: // null field bit map - DataBuffer *null_bitmap_; + Bitmap8 *null_bitmap_; + + // Writer: write pointer + // Reader: total rows + uint32 total_rows_; - // the column is encoded type + // some of subclass will not implements the not null logic, + // but can direct get not null rows by data part. + size_t non_null_rows_; + + // the column encoded type ColumnEncoding_Kind encoded_type_; - // whether the column is storage - PaxColumnStorageType storage_type_; + // the column compress level + int compress_level_; + + // data part align size. + // This field only takes effect when current column is no encoding/compress. + // + // About `type_align` in `pg_type` what you need to know: + // 1. address alignment: the datum which return need alignment with + // `type_align` + // 2. datum padding: the datum need padding with `type_align` + // + // The align logic in pax: + // 1. 
address alignment: + // - write will make sure address alignment(data stream) in disk + // - `ReadTuple` with/without memcpy should get a alignment datum + // 2. datum padding: deal it in column `Append` + size_t type_align_size_; private: PaxColumn(const PaxColumn &); @@ -115,7 +237,7 @@ class PaxColumn { template class PaxCommColumn : public PaxColumn { public: - explicit PaxCommColumn(uint64 capacity); + explicit PaxCommColumn(uint32 capacity); ~PaxCommColumn() override; @@ -125,6 +247,8 @@ class PaxCommColumn : public PaxColumn { PaxColumnTypeInMem GetPaxColumnTypeInMem() const override; + PaxStorageFormat GetStorageFormat() const override; + void Append(char *buffer, size_t size) override; std::pair GetBuffer(size_t position) override; @@ -134,8 +258,6 @@ class PaxCommColumn : public PaxColumn { size_t GetNonNullRows() const override; - void Clear() override; - size_t PhysicalSize() const override; int64 GetOriginLength() const override; @@ -145,10 +267,6 @@ class PaxCommColumn : public PaxColumn { int32 GetTypeLength() const override; protected: - virtual void ReSize(uint64 capacity); - - protected: - uint64 capacity_; DataBuffer *data_; }; @@ -162,20 +280,20 @@ extern template class PaxCommColumn; class PaxNonFixedColumn : public PaxColumn { public: - explicit PaxNonFixedColumn(uint64 capacity); + explicit PaxNonFixedColumn(uint32 capacity); PaxNonFixedColumn(); ~PaxNonFixedColumn() override; - virtual void Set(DataBuffer *data, DataBuffer *lengths, + virtual void Set(DataBuffer *data, DataBuffer *lengths, size_t total_size); void Append(char *buffer, size_t size) override; PaxColumnTypeInMem GetPaxColumnTypeInMem() const override; - void Clear() override; + PaxStorageFormat GetStorageFormat() const override; std::pair GetBuffer() override; @@ -192,18 +310,22 @@ class PaxNonFixedColumn : public PaxColumn { size_t GetNonNullRows() const override; - DataBuffer *GetLengthBuffer() const; + DataBuffer *GetLengthBuffer() const; - bool IsMemTakeOver() const; + 
DataBuffer *GetOffsetBuffer(bool append_last = false); - void SetMemTakeOver(bool take_over); + protected: + void BuildOffsets(); protected: size_t estimated_size_; DataBuffer *data_; - // orc needs to serialize int64 array - DataBuffer *lengths_; + // orc needs to serialize int32 array + // the length of a single tuple field will not exceed 2GB, + // so a variable-length element of the lengths stream can use int32 + // to represent the length + DataBuffer *lengths_; std::vector offsets_; }; diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.cc b/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.cc new file mode 100644 index 00000000000..6b2335dd09c --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.cc @@ -0,0 +1,236 @@ +#include "storage/columns/pax_column_cache.h" + +#include + +#ifdef ENABLE_PLASMA +namespace pax { + +struct PaxColumnsMeta { + int16 type_len : 8; + uint32 null_size : 32; + uint32 data_size : 32; + uint32 len_size : 32; + uint32 rows : 32; +} __attribute__((__aligned__(8))); + +static std::string BuildCacheKey(const std::string &file_name, + const uint16 column_index, + const uint16 group_index) { + unsigned char key_str[20]; + + CBDB_CHECK(uuid_parse(file_name.c_str(), key_str) == 0, + cbdb::CException::ExType::kExTypeCError); + + static_assert(sizeof(uuid_t) == 16, "Invalid uuid_t length"); + memcpy(key_str + 16, &column_index, sizeof(uint16)); + memcpy(key_str + 18, &group_index, sizeof(uint16)); + + return std::string((char *)key_str, 20); +} + +PaxColumnCache::PaxColumnCache(PaxCache *cache, const std::string &file_name, + bool *proj, size_t proj_num) + : pax_cache_(cache), + file_name_(file_name), + proj_(proj), + proj_num_(proj_num) { + Assert(pax_cache_ && proj_); +} + +template +static PaxColumn *NewFixColumn(const char *buffer, size_t buffer_len) { + auto column = PAX_NEW>(0); + Assert(buffer_len % sizeof(T) == 0); + auto data_buffer = PAX_NEW>((T *)(buffer), buffer_len, 
false, false); + data_buffer->BrushAll(); + column->Set(data_buffer); + return column; +} + +std::tuple, bool *> +PaxColumnCache::ReadCache(size_t group_index) { + PaxColumns *columns = PAX_NEW(); + std::vector keys; + std::vector batchs; + size_t cache_index = 0; + int64 rows = -1; + bool *proj_copy = PAX_NEW_ARRAY(proj_num_); + size_t no_proj_num = 0; + + memcpy(proj_copy, proj_, proj_num_); + + for (size_t i = 0; i < proj_num_; i++) { + if (!proj_copy[i]) { + continue; + } + keys.emplace_back(BuildCacheKey(file_name_, i, group_index)); + } + + auto status = pax_cache_->Get(keys, batchs); + if (!status.Ok()) { + keys.clear(); + // TODO(jiaqizho): add log here + return std::make_tuple(nullptr, keys, proj_copy); + } + + for (size_t i = 0; i < proj_num_; i++) { + if (!proj_copy[i]) { + no_proj_num++; + columns->Append(nullptr); + continue; + } + auto batch_buffer = batchs[cache_index++]; + + if (batch_buffer.not_exist) { + keys[i - no_proj_num] = ""; + columns->Append(nullptr); + continue; + } + + Assert(batch_buffer.meta_len == sizeof(PaxColumnsMeta)); + PaxColumnsMeta *meta = (PaxColumnsMeta *)batch_buffer.meta; + + AssertImply(rows != -1, (size_t)rows == meta->rows); + rows = meta->rows; + + Assert(batch_buffer.buffer_len == + (size_t)(meta->null_size + meta->data_size + meta->len_size)); + + PaxColumn *column = nullptr; + switch (meta->type_len) { + case -1: { + auto non_fixed_column = PAX_NEW(0); + Assert(meta->len_size % sizeof(int64) == 0); + auto data_buffer = PAX_NEW>( + (char *)(batch_buffer.buffer + meta->null_size), meta->data_size, + false, false); + auto len_data_buffer = PAX_NEW>( + (int64 *)(batch_buffer.buffer + meta->null_size + meta->data_size), + meta->len_size, false, false); + data_buffer->BrushAll(); + len_data_buffer->BrushAll(); + + non_fixed_column->Set(data_buffer, len_data_buffer, + batch_buffer.buffer_len); + column = non_fixed_column; + break; + } + case 1: { + column = NewFixColumn(batch_buffer.buffer + meta->null_size, + 
meta->data_size); + break; + } + case 2: { + column = NewFixColumn(batch_buffer.buffer + meta->null_size, + meta->data_size); + break; + } + case 4: { + column = NewFixColumn(batch_buffer.buffer + meta->null_size, + meta->data_size); + break; + } + case 8: { + column = NewFixColumn(batch_buffer.buffer + meta->null_size, + meta->data_size); + break; + } + default: { + Assert(false); + } + } + + if (meta->null_size != 0) { + auto null_bitmap = PAX_NEW( + BitmapRaw((uint8 *)(batch_buffer.buffer), meta->null_size), + BitmapTpl::ReadOnlyRefBitmap); + column->SetBitmap(null_bitmap); + } else { + column->SetBitmap(nullptr); + } + + columns->Append(column); + proj_copy[i] = false; + } + + if (rows != -1) { + columns->AddRows(rows); + } + + return std::make_tuple(columns, keys, proj_copy); +} + +void PaxColumnCache::ReleaseCache(std::vector keys) { + for (auto &key : keys) { + if (key.length() != 0) pax_cache_->Release(key); + } +} + +void PaxColumnCache::WriteCache(PaxColumns *columns, size_t group_index) { + std::string key; + PaxColumnsMeta meta{}; + int64 rows = -1; + + for (size_t i = 0; i < proj_num_; i++) { + auto column = (*columns)[i]; + if (!proj_[i] || !column) { + continue; + } + + key = BuildCacheKey(file_name_, i, group_index); + + AssertImply(rows != -1, (size_t)rows == column->GetRows()); + rows = column->GetRows(); + + std::vector> buffers; + + if (column->HasNull()) { + auto bm = column->GetBitmap(); + Assert(bm); + auto nbytes = bm->MinimalStoredBytes(column->GetRows()); + Assert(nbytes <= bm->Raw().size); + + meta.null_size = nbytes; + buffers.emplace_back( + std::make_pair(reinterpret_cast(bm->Raw().bitmap), nbytes)); + } else { + meta.null_size = 0; + } + + char *buffer = nullptr; + size_t buffer_len = 0; + + if (column->GetPaxColumnTypeInMem() == kTypeNonFixed) { + auto non_fixed_column = (PaxNonFixedColumn *)column; + std::tie(buffer, buffer_len) = non_fixed_column->GetBuffer(); + auto len_buffer = non_fixed_column->GetLengthBuffer(); + + 
buffers.emplace_back(std::make_pair(buffer, buffer_len)); + buffers.emplace_back( + std::make_pair((char *)len_buffer->GetBuffer(), len_buffer->Used())); + + meta.type_len = non_fixed_column->GetTypeLength(); + meta.data_size = buffer_len; + meta.len_size = len_buffer->Used(); + meta.rows = rows; + } else if (column->GetPaxColumnTypeInMem() == kTypeFixed) { + std::tie(buffer, buffer_len) = column->GetBuffer(); + buffers.emplace_back(std::make_pair(buffer, buffer_len)); + + meta.type_len = column->GetTypeLength(); + meta.data_size = buffer_len; + meta.len_size = 0; + meta.rows = rows; + + } else { + Assert(false); + } + + pax_cache_->Put(key, buffers, + std::make_pair((char *)&meta, sizeof(PaxColumnsMeta))); + } +} + +} // namespace pax + +#endif // ENABLE_PLASMA diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.h b/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.h new file mode 100644 index 00000000000..ee56de5a1b1 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column_cache.h @@ -0,0 +1,38 @@ +#pragma once +#include +#include +#include + +#include "storage/columns/pax_columns.h" + +#ifdef ENABLE_PLASMA +#include "storage/cache/pax_plasma_cache.h" +namespace pax { + +class PaxColumnCache final { + public: + PaxColumnCache(PaxCache *cache, const std::string &file_name, bool *proj, + size_t proj_num); + + ~PaxColumnCache() = default; + + // Read the cache from current group + // Return the tuple with + // + std::tuple, bool *> ReadCache( + size_t group_index); + + void ReleaseCache(std::vector keys); + + void WriteCache(PaxColumns *columns, size_t group_index); + + private: + PaxCache *pax_cache_; + std::string file_name_; + bool *proj_; + size_t proj_num_; +}; + +}; // namespace pax + +#endif // ENABLE_PLASMA diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.cc b/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.cc deleted file mode 100644 index 51419bd6ffd..00000000000 --- 
a/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.cc +++ /dev/null @@ -1,43 +0,0 @@ - -#include "storage/columns/pax_column_int.h" - -namespace pax { - -template -PaxIntColumn::PaxIntColumn(const PaxEncoder::EncodingOption &encoding_option) - : PaxEncodingColumn(DEFAULT_CAPACITY, encoding_option) { - PaxEncodingColumn::InitEncoder(); -} - -template -PaxIntColumn::PaxIntColumn(uint64 capacity, - const PaxEncoder::EncodingOption &encoding_option) - : PaxEncodingColumn(capacity, encoding_option) { - PaxEncodingColumn::InitEncoder(); -} - -template -PaxIntColumn::PaxIntColumn(const PaxDecoder::DecodingOption &decoding_option) - : PaxEncodingColumn(DEFAULT_CAPACITY, decoding_option) { - PaxEncodingColumn::InitDecoder(); -} - -template -PaxIntColumn::PaxIntColumn(uint64 capacity, - const PaxDecoder::DecodingOption &decoding_option) - : PaxEncodingColumn(capacity, decoding_option) { - PaxEncodingColumn::InitDecoder(); -} - -template -ColumnEncoding_Kind PaxIntColumn::GetDefaultColumnType() { - return sizeof(T) >= 4 ? 
ColumnEncoding_Kind::ColumnEncoding_Kind_ORC_RLE_V2 - : ColumnEncoding_Kind::ColumnEncoding_Kind_DIRECT_DELTA; -} - -template class PaxIntColumn; -template class PaxIntColumn; -template class PaxIntColumn; -template class PaxIntColumn; - -} // namespace pax diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.h b/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.h deleted file mode 100644 index e38b8c3f0cd..00000000000 --- a/contrib/pax_storage/src/cpp/storage/columns/pax_column_int.h +++ /dev/null @@ -1,31 +0,0 @@ - -#pragma once -#include "storage/columns/pax_encoding_column.h" - -namespace pax { - -template -class PaxIntColumn final : public PaxEncodingColumn { - public: - explicit PaxIntColumn(const PaxEncoder::EncodingOption &encoding_option); - - PaxIntColumn(uint64 capacity, - const PaxEncoder::EncodingOption &encoding_option); - - explicit PaxIntColumn(const PaxDecoder::DecodingOption &decoding_option); - - PaxIntColumn(uint64 capacity, - const PaxDecoder::DecodingOption &decoding_option); - - ~PaxIntColumn() override = default; - - protected: - ColumnEncoding_Kind GetDefaultColumnType() override; -}; - -extern template class PaxIntColumn; -extern template class PaxIntColumn; -extern template class PaxIntColumn; -extern template class PaxIntColumn; - -} // namespace pax diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_test.cc b/contrib/pax_storage/src/cpp/storage/columns/pax_column_test.cc index 640975de062..96128117b29 100644 --- a/contrib/pax_storage/src/cpp/storage/columns/pax_column_test.cc +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column_test.cc @@ -5,12 +5,11 @@ #include "comm/cbdb_wrappers.h" #include "comm/gtest_wrappers.h" #include "exceptions/CException.h" -#include "storage/columns/pax_column_int.h" -#include "storage/columns/pax_encoding_column.h" -#include "storage/columns/pax_encoding_non_fixed_column.h" +#include "pax_gtest_helper.h" +#include "storage/columns/pax_column_traits.h" 
namespace pax::tests { - +using namespace pax::traits; static void AppendInt4All(PaxColumn *pax_column, size_t bits) { int64 data; for (int16 i = INT16_MIN; i <= INT16_MAX; ++i) { // dead loop @@ -55,123 +54,168 @@ static void VerifyInt4All(char *verify_buff, size_t verify_len, size_t bits) { } static PaxColumn *CreateEncodeColumn( - uint8 bits, const PaxEncoder::EncodingOption &encoding_option) { + uint8 bits, const PaxEncoder::EncodingOption &encoding_option, + PaxStorageFormat storage_type = PaxStorageFormat::kTypeStorageOrcNonVec) { PaxColumn *int_column; switch (bits) { case 16: - int_column = new PaxIntColumn(1024, std::move(encoding_option)); + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } else { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } break; case 32: - int_column = new PaxIntColumn(1024, std::move(encoding_option)); + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } else { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } break; case 64: - int_column = new PaxIntColumn(1024, std::move(encoding_option)); + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } else { + int_column = + ColumnOptCreateTraits::create_encoding( + 1024, std::move(encoding_option)); + } break; default: int_column = nullptr; break; } + return int_column; } static PaxColumn *CreateDecodeColumn( - uint8 bits, size_t origin_lem, + uint8 bits, size_t origin_len, size_t origin_rows, const PaxDecoder::DecodingOption &decoding_option, char *encoded_buff, - size_t encoded_len) { + size_t encoded_len, + PaxStorageFormat storage_type = 
PaxStorageFormat::kTypeStorageOrcNonVec, + size_t column_not_nulls = 0) { + PaxColumn *column_rc = nullptr; switch (bits) { case 16: { auto *buffer_for_read = new DataBuffer( reinterpret_cast(encoded_buff), encoded_len, false, false); buffer_for_read->Brush(encoded_len); - auto int_column = new PaxIntColumn(origin_lem / sizeof(int16), - std::move(decoding_option)); - int_column->Set(buffer_for_read); - - return int_column; + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int16), std::move(decoding_option)); + int_column->Set(buffer_for_read); + column_rc = int_column; + } else { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int16), std::move(decoding_option)); + int_column->Set(buffer_for_read, column_not_nulls); + column_rc = int_column; + } + break; } case 32: { auto *buffer_for_read = new DataBuffer( reinterpret_cast(encoded_buff), encoded_len, false, false); buffer_for_read->Brush(encoded_len); - auto int_column = new PaxIntColumn(origin_lem / sizeof(int32), - std::move(decoding_option)); - int_column->Set(buffer_for_read); - return int_column; + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int32), std::move(decoding_option)); + int_column->Set(buffer_for_read); + column_rc = int_column; + } else { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int32), std::move(decoding_option)); + int_column->Set(buffer_for_read, column_not_nulls); + column_rc = int_column; + } + break; } case 64: { auto *buffer_for_read = new DataBuffer( reinterpret_cast(encoded_buff), encoded_len, false, false); buffer_for_read->Brush(encoded_len); - auto int_column = new PaxIntColumn(origin_lem / sizeof(int64), - std::move(decoding_option)); - int_column->Set(buffer_for_read); - return int_column; + if (storage_type 
== PaxStorageFormat::kTypeStorageOrcNonVec) { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int64), std::move(decoding_option)); + int_column->Set(buffer_for_read); + column_rc = int_column; + } else { + auto int_column = + ColumnOptCreateTraits::create_decoding( + origin_len / sizeof(int64), std::move(decoding_option)); + int_column->Set(buffer_for_read, column_not_nulls); + column_rc = int_column; + } + break; } default: { return nullptr; } } - return nullptr; + + if (column_rc) { + column_rc->SetRows(origin_rows); + } + return column_rc; } -class PaxColumnTest : public ::testing::Test { +class PaxColumnTest : public ::testing::TestWithParam { public: - void SetUp() override { - MemoryContext orc_test_memory_context = AllocSetContextCreate( - (MemoryContext)NULL, "PaxColumn memory context", 80 * 1024 * 1024, - 80 * 1024 * 1024, 80 * 1024 * 1024); - - MemoryContextSwitchTo(orc_test_memory_context); - } + void SetUp() override { CreateMemoryContext(); } }; -class PaxColumnEncodingTest : public ::testing::TestWithParam { +class PaxColumnEncodingTest : public ::testing::TestWithParam< + ::testing::tuple> { public: - void SetUp() override { - MemoryContext orc_test_memory_context = AllocSetContextCreate( - (MemoryContext)NULL, "PaxColumn memory context", 80 * 1024 * 1024, - 80 * 1024 * 1024, 80 * 1024 * 1024); - - MemoryContextSwitchTo(orc_test_memory_context); - } + void SetUp() override { CreateMemoryContext(); } }; class PaxColumnCompressTest : public ::testing::TestWithParam< ::testing::tuple> { public: - void SetUp() override { - MemoryContext orc_test_memory_context = AllocSetContextCreate( - (MemoryContext)NULL, "PaxColumn memory context", 800 * 1024 * 1024, - 800 * 1024 * 1024, 800 * 1024 * 1024); - - MemoryContextSwitchTo(orc_test_memory_context); - } + void SetUp() override { CreateMemoryContext(); } }; class PaxNonFixedColumnCompressTest : public ::testing::TestWithParam< ::testing::tuple> { public: - void SetUp() 
override { - MemoryContext orc_test_memory_context = AllocSetContextCreate( - (MemoryContext)NULL, "PaxColumn memory context", 800 * 1024 * 1024, - 800 * 1024 * 1024, 800 * 1024 * 1024); - - MemoryContextSwitchTo(orc_test_memory_context); - } + void SetUp() override { CreateMemoryContext(); } }; -TEST_F(PaxColumnTest, FixColumnGetRangeBufferTest) { +TEST_P(PaxColumnTest, FixColumnGetRangeBufferTest) { PaxColumn *column; + auto storage_type = GetParam(); char *buffer = nullptr; size_t buffer_len = 0; - column = new PaxCommColumn(200); + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + column = ColumnCreateTraits::create(200); + } else { + column = ColumnCreateTraits::create(200); + } + for (int32 i = 0; i < 16; i++) { column->Append(reinterpret_cast(&i), sizeof(int32)); } @@ -186,7 +230,12 @@ TEST_F(PaxColumnTest, FixColumnGetRangeBufferTest) { ASSERT_EQ(column->GetRows(), 16); ASSERT_EQ(column->GetRangeNonNullRows(0, column->GetRows()), 16); - column->Clear(); + delete column; + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + column = ColumnCreateTraits::create(200); + } else { + column = ColumnCreateTraits::create(200); + } for (int32 i = 0; i < 16; i++) { if (i % 3 == 0) { @@ -195,12 +244,37 @@ TEST_F(PaxColumnTest, FixColumnGetRangeBufferTest) { column->Append(reinterpret_cast(&i), sizeof(int32)); } - std::tie(buffer, buffer_len) = column->GetRangeBuffer(5, 10); - ASSERT_EQ(buffer_len, 10 * sizeof(int32)); + switch (storage_type) { + case kTypeStorageOrcNonVec: { + std::tie(buffer, buffer_len) = column->GetRangeBuffer(5, 10); + ASSERT_EQ(buffer_len, 10 * sizeof(int32)); - for (size_t i = 5; i < 16; i++) { - auto *i_32 = reinterpret_cast(buffer + ((i - 5) * sizeof(int32))); - ASSERT_EQ(*i_32, (int32)i); + for (size_t i = 5; i < 16; i++) { + auto *i_32 = + reinterpret_cast(buffer + ((i - 5) * sizeof(int32))); + ASSERT_EQ(*i_32, (int32)i); + } + break; + } + case kTypeStorageOrcVec: { + std::tie(buffer, buffer_len) = 
column->GetRangeBuffer(0, 10); + ASSERT_EQ(buffer_len, 10 * sizeof(int32)); + + size_t nulls_count = 0; + for (size_t i = 0; i < 10; i++) { + auto *i_32 = reinterpret_cast(buffer + (i * sizeof(int32))); + if (i % 4 == 0) { + nulls_count++; + ASSERT_EQ(*i_32, 0); + } else { + ASSERT_EQ(*i_32, (int32)i - nulls_count); + } + } + + break; + } + default: + break; } ASSERT_EQ(column->GetRows(), 16 + 6); @@ -209,12 +283,18 @@ TEST_F(PaxColumnTest, FixColumnGetRangeBufferTest) { delete column; } -TEST_F(PaxColumnTest, NonFixColumnGetRangeBufferTest) { +TEST_P(PaxColumnTest, NonFixColumnGetRangeBufferTest) { PaxColumn *column; + auto storage_type = GetParam(); char *buffer = nullptr; size_t buffer_len = 0; - column = new PaxNonFixedColumn(200); + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + column = ColumnCreateTraits2::create(200); + } else { + column = ColumnCreateTraits2::create(200); + } + for (int64 i = 0; i < 16; i++) { column->Append(reinterpret_cast(&i), sizeof(int64)); } @@ -223,13 +303,19 @@ TEST_F(PaxColumnTest, NonFixColumnGetRangeBufferTest) { ASSERT_EQ(buffer_len, 10 * sizeof(int64)); for (size_t i = 5; i < 16; i++) { - auto *i_32 = reinterpret_cast(buffer + ((i - 5) * sizeof(int64))); - ASSERT_EQ(*i_32, (int64)i); + auto *i_64 = reinterpret_cast(buffer + ((i - 5) * sizeof(int64))); + ASSERT_EQ(*i_64, (int64)i); } ASSERT_EQ(column->GetRows(), 16); ASSERT_EQ(column->GetRangeNonNullRows(0, column->GetRows()), 16); - column->Clear(); + delete column; + + if (storage_type == PaxStorageFormat::kTypeStorageOrcNonVec) { + column = ColumnCreateTraits2::create(200); + } else { + column = ColumnCreateTraits2::create(200); + } for (int64 i = 0; i < 16; i++) { if (i % 3 == 0) { @@ -238,12 +324,49 @@ TEST_F(PaxColumnTest, NonFixColumnGetRangeBufferTest) { column->Append(reinterpret_cast(&i), sizeof(int64)); } - std::tie(buffer, buffer_len) = column->GetRangeBuffer(5, 10); - ASSERT_EQ(buffer_len, 10 * sizeof(int64)); + switch (storage_type) { + case 
kTypeStorageOrcNonVec: { + std::tie(buffer, buffer_len) = column->GetRangeBuffer(5, 10); + ASSERT_EQ(buffer_len, 10 * sizeof(int64)); - for (size_t i = 5; i < 16; i++) { - auto *i_32 = reinterpret_cast(buffer + ((i - 5) * sizeof(int64))); - ASSERT_EQ(*i_32, (int64)i); + for (size_t i = 5; i < 16; i++) { + auto *i_64 = + reinterpret_cast(buffer + ((i - 5) * sizeof(int64))); + ASSERT_EQ(*i_64, (int64)i); + } + break; + } + case kTypeStorageOrcVec: { + size_t nulls_count = 0; + for (size_t i = 0; i < 10; i++) { + std::tie(buffer, buffer_len) = column->GetBuffer(i); + if (buffer) { + ASSERT_EQ(i - nulls_count, *reinterpret_cast(buffer)); + } else { + nulls_count++; + } + } + + std::tie(buffer, buffer_len) = column->GetRangeBuffer(0, 10); + + // 0 4 8 is null + ASSERT_EQ(buffer_len, 7 * sizeof(int64)); + + nulls_count = 0; + for (size_t i = 0; i < 10; i++) { + auto *i_64 = reinterpret_cast( + buffer + ((i - nulls_count) * sizeof(int64))); + if (i % 4 == 0) { + nulls_count++; + } else { + ASSERT_EQ(*i_64, (int32)i - nulls_count); + } + } + + break; + } + default: + break; } ASSERT_EQ(column->GetRows(), 16 + 6); @@ -254,7 +377,8 @@ TEST_F(PaxColumnTest, NonFixColumnGetRangeBufferTest) { TEST_P(PaxColumnEncodingTest, GetRangeEncodingColumnTest) { PaxColumn *int_column; - auto bits = GetParam(); + auto bits = ::testing::get<0>(GetParam()); + auto storage_type = ::testing::get<1>(GetParam()); if (bits < 32) { return; } @@ -264,7 +388,8 @@ TEST_P(PaxColumnEncodingTest, GetRangeEncodingColumnTest) { ColumnEncoding_Kind::ColumnEncoding_Kind_DEF_ENCODED; encoding_option.is_sign = true; - int_column = CreateEncodeColumn(bits, std::move(encoding_option)); + int_column = + CreateEncodeColumn(bits, std::move(encoding_option), storage_type); ASSERT_TRUE(int_column); int64 data; @@ -280,16 +405,19 @@ TEST_P(PaxColumnEncodingTest, GetRangeEncodingColumnTest) { ASSERT_LT(encoded_len, UINT16_MAX); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = 
int_column->GetRows(); ASSERT_EQ(origin_len, (100) * bits / 8); PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = - ColumnEncoding_Kind::ColumnEncoding_Kind_ORC_RLE_V2; + ColumnEncoding_Kind::ColumnEncoding_Kind_RLE_V2; decoding_option.is_sign = true; auto int_column_for_read = CreateDecodeColumn( - bits, origin_len, std::move(decoding_option), encoded_buff, encoded_len); + bits, origin_len, origin_rows, std::move(decoding_option), encoded_buff, + encoded_len, storage_type, 100); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 0); char *verify_buff; size_t verify_len; std::tie(verify_buff, verify_len) = @@ -317,7 +445,7 @@ TEST_P(PaxColumnCompressTest, FixedCompressColumnGetRangeTest) { PaxEncoder::EncodingOption encoding_option; encoding_option.column_encode_type = kind; - encoding_option.compress_lvl = 5; + encoding_option.compress_level = 5; encoding_option.is_sign = true; int_column = CreateEncodeColumn(bits, std::move(encoding_option)); @@ -336,6 +464,7 @@ TEST_P(PaxColumnCompressTest, FixedCompressColumnGetRangeTest) { ASSERT_LT(encoded_len, UINT16_MAX); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = int_column->GetRows(); ASSERT_EQ(origin_len, kind != ColumnEncoding_Kind_NO_ENCODED ? 
(100) * bits / 8 : NO_ENCODE_ORIGIN_LEN); @@ -343,11 +472,13 @@ TEST_P(PaxColumnCompressTest, FixedCompressColumnGetRangeTest) { PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = kind; decoding_option.is_sign = true; + decoding_option.compress_level = 5; auto int_column_for_read = - CreateDecodeColumn(bits, (100) * bits / 8, std::move(decoding_option), - encoded_buff, encoded_len); + CreateDecodeColumn(bits, (100) * bits / 8, origin_rows, + std::move(decoding_option), encoded_buff, encoded_len); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 5); char *verify_buff; size_t verify_len; std::tie(verify_buff, verify_len) = @@ -370,7 +501,8 @@ TEST_P(PaxColumnCompressTest, FixedCompressColumnGetRangeTest) { TEST_P(PaxColumnEncodingTest, PaxEncodingColumnDefault) { PaxColumn *int_column; - auto bits = GetParam(); + auto bits = ::testing::get<0>(GetParam()); + auto storage_type = ::testing::get<1>(GetParam()); if (bits < 32) { return; } @@ -380,7 +512,8 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnDefault) { ColumnEncoding_Kind::ColumnEncoding_Kind_DEF_ENCODED; encoding_option.is_sign = true; - int_column = CreateEncodeColumn(bits, std::move(encoding_option)); + int_column = + CreateEncodeColumn(bits, std::move(encoding_option), storage_type); ASSERT_TRUE(int_column); AppendInt4All(int_column, bits); @@ -392,16 +525,19 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnDefault) { ASSERT_LT(encoded_len, UINT16_MAX); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = int_column->GetRows(); ASSERT_EQ(origin_len, (UINT16_MAX + 1) * bits / 8); PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = - ColumnEncoding_Kind::ColumnEncoding_Kind_ORC_RLE_V2; + ColumnEncoding_Kind::ColumnEncoding_Kind_RLE_V2; decoding_option.is_sign = true; auto int_column_for_read = CreateDecodeColumn( - bits, origin_len, std::move(decoding_option), encoded_buff, encoded_len); + bits, origin_len, origin_rows, 
std::move(decoding_option), encoded_buff, + encoded_len, storage_type); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 0); char *verify_buff; size_t verify_len; std::tie(verify_buff, verify_len) = int_column_for_read->GetBuffer(); @@ -413,14 +549,16 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnDefault) { TEST_P(PaxColumnEncodingTest, PaxEncodingColumnSpecType) { PaxColumn *int_column; - auto bits = GetParam(); + auto bits = ::testing::get<0>(GetParam()); + auto storage_type = ::testing::get<1>(GetParam()); PaxEncoder::EncodingOption encoding_option; encoding_option.column_encode_type = - ColumnEncoding_Kind::ColumnEncoding_Kind_ORC_RLE_V2; + ColumnEncoding_Kind::ColumnEncoding_Kind_RLE_V2; encoding_option.is_sign = true; - int_column = CreateEncodeColumn(bits, std::move(encoding_option)); + int_column = + CreateEncodeColumn(bits, std::move(encoding_option), storage_type); ASSERT_TRUE(int_column); AppendInt4All(int_column, bits); @@ -432,15 +570,18 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnSpecType) { ASSERT_LT(encoded_len, UINT16_MAX); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = int_column->GetRows(); ASSERT_EQ(origin_len, (UINT16_MAX + 1) * bits / 8); PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = - ColumnEncoding_Kind::ColumnEncoding_Kind_ORC_RLE_V2; + ColumnEncoding_Kind::ColumnEncoding_Kind_RLE_V2; decoding_option.is_sign = true; auto int_column_for_read = CreateDecodeColumn( - bits, origin_len, std::move(decoding_option), encoded_buff, encoded_len); + bits, origin_len, origin_rows, std::move(decoding_option), encoded_buff, + encoded_len, storage_type); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 0); char *verify_buff; size_t verify_len; @@ -453,14 +594,16 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnSpecType) { TEST_P(PaxColumnEncodingTest, PaxEncodingColumnNoEncoding) { PaxColumn *int_column; - auto bits = GetParam(); + auto bits = ::testing::get<0>(GetParam()); + 
auto storage_type = ::testing::get<1>(GetParam()); PaxEncoder::EncodingOption encoding_option; encoding_option.column_encode_type = ColumnEncoding_Kind::ColumnEncoding_Kind_NO_ENCODED; encoding_option.is_sign = true; - int_column = CreateEncodeColumn(bits, std::move(encoding_option)); + int_column = + CreateEncodeColumn(bits, std::move(encoding_option), storage_type); ASSERT_TRUE(int_column); AppendInt4All(int_column, bits); @@ -471,6 +614,7 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnNoEncoding) { ASSERT_NE(encoded_buff, nullptr); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = int_column->GetRows(); ASSERT_EQ(origin_len, NO_ENCODE_ORIGIN_LEN); PaxDecoder::DecodingOption decoding_option; @@ -479,8 +623,9 @@ TEST_P(PaxColumnEncodingTest, PaxEncodingColumnNoEncoding) { decoding_option.is_sign = true; auto int_column_for_read = CreateDecodeColumn( - bits, encoded_len, std::move(decoding_option), encoded_buff, encoded_len); - + bits, encoded_len, origin_rows, std::move(decoding_option), encoded_buff, + encoded_len, storage_type); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 0); char *verify_buff; size_t verify_len; std::tie(verify_buff, verify_len) = int_column_for_read->GetBuffer(); @@ -497,7 +642,7 @@ TEST_P(PaxColumnCompressTest, PaxEncodingColumnCompressDecompress) { PaxEncoder::EncodingOption encoding_option; encoding_option.column_encode_type = kind; - encoding_option.compress_lvl = 5; + encoding_option.compress_level = 5; encoding_option.is_sign = true; int_column = CreateEncodeColumn(bits, std::move(encoding_option)); @@ -511,6 +656,7 @@ TEST_P(PaxColumnCompressTest, PaxEncodingColumnCompressDecompress) { ASSERT_NE(encoded_buff, nullptr); auto origin_len = int_column->GetOriginLength(); + auto origin_rows = int_column->GetRows(); ASSERT_EQ(origin_len, kind != ColumnEncoding_Kind_NO_ENCODED ? 
(UINT16_MAX + 1) * bits / 8 : NO_ENCODE_ORIGIN_LEN); @@ -518,11 +664,13 @@ TEST_P(PaxColumnCompressTest, PaxEncodingColumnCompressDecompress) { PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = kind; decoding_option.is_sign = true; + decoding_option.compress_level = 5; auto int_column_for_read = - CreateDecodeColumn(bits, (UINT16_MAX + 1) * bits / 8, + CreateDecodeColumn(bits, (UINT16_MAX + 1) * bits / 8, origin_rows, std::move(decoding_option), encoded_buff, encoded_len); + ASSERT_EQ(int_column_for_read->GetCompressLevel(), 5); char *verify_buff; size_t verify_len; std::tie(verify_buff, verify_len) = int_column_for_read->GetBuffer(); @@ -543,7 +691,7 @@ TEST_P(PaxNonFixedColumnCompressTest, PaxEncoder::EncodingOption encoding_option; encoding_option.column_encode_type = kind; - encoding_option.compress_lvl = 5; + encoding_option.compress_level = 5; encoding_option.is_sign = true; non_fixed_column = @@ -577,16 +725,17 @@ TEST_P(PaxNonFixedColumnCompressTest, PaxDecoder::DecodingOption decoding_option; decoding_option.column_encode_type = kind; decoding_option.is_sign = true; + decoding_option.compress_level = 5; auto non_fixed_column_for_read = new PaxNonFixedEncodingColumn( buffer_len * number, std::move(decoding_option)); auto data_buffer_for_read = new DataBuffer(encoded_buff, encoded_len, false, false); data_buffer_for_read->Brush(encoded_len); - auto length_buffer_cpy = new DataBuffer(*length_buffer); + auto length_buffer_cpy = new DataBuffer(*length_buffer); non_fixed_column_for_read->Set(data_buffer_for_read, length_buffer_cpy, origin_len); - + ASSERT_EQ(non_fixed_column_for_read->GetCompressLevel(), 5); char *verify_buff; size_t verify_len; @@ -612,8 +761,15 @@ TEST_P(PaxNonFixedColumnCompressTest, delete non_fixed_column_for_read; } -INSTANTIATE_TEST_CASE_P(PaxColumnEncodingTestCombine, PaxColumnEncodingTest, - testing::Values(16, 32, 64)); +INSTANTIATE_TEST_CASE_P(PaxColumnTestCombine, PaxColumnTest, + 
testing::Values(PaxStorageFormat::kTypeStorageOrcNonVec, + PaxStorageFormat::kTypeStorageOrcVec)); + +INSTANTIATE_TEST_CASE_P( + PaxColumnEncodingTestCombine, PaxColumnEncodingTest, + testing::Combine(testing::Values(16, 32, 64), + testing::Values(PaxStorageFormat::kTypeStorageOrcNonVec, + PaxStorageFormat::kTypeStorageOrcVec))); INSTANTIATE_TEST_CASE_P( PaxColumnEncodingTestCombine, PaxColumnCompressTest, diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.cc b/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.cc new file mode 100644 index 00000000000..e23364ddd3a --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.cc @@ -0,0 +1,114 @@ +#include "storage/columns/pax_column_traits.h" + +namespace pax::traits { + + +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; + +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc> + ColumnCreateTraits::create = + Impl::CreateImpl>; +Impl::CreateFunc + ColumnCreateTraits2::create = + Impl::CreateImpl; +Impl::CreateFunc + ColumnCreateTraits2::create = + Impl::CreateImpl; + + + +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; 
+Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; + +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateEncodingFunc> + ColumnOptCreateTraits::create_encoding = + Impl::CreateEncodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; +Impl::CreateDecodingFunc> + ColumnOptCreateTraits::create_decoding = + Impl::CreateDecodingImpl>; + +Impl::CreateEncodingFunc + ColumnOptCreateTraits2::create_encoding = + Impl::CreateEncodingImpl; +Impl::CreateDecodingFunc + ColumnOptCreateTraits2::create_decoding = + Impl::CreateDecodingImpl; +Impl::CreateEncodingFunc + ColumnOptCreateTraits2::create_encoding = + Impl::CreateEncodingImpl; +Impl::CreateDecodingFunc + ColumnOptCreateTraits2::create_decoding = + Impl::CreateDecodingImpl; +} // namespace pax::traits diff --git a/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.h b/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.h new file mode 100644 index 
00000000000..d992a70ec91 --- /dev/null +++ b/contrib/pax_storage/src/cpp/storage/columns/pax_column_traits.h @@ -0,0 +1,115 @@ +#pragma once +#include "comm/pax_memory.h" +#include "storage/columns/pax_column.h" +#include "storage/columns/pax_encoding_column.h" +#include "storage/columns/pax_encoding_non_fixed_column.h" +#include "storage/columns/pax_vec_column.h" +#include "storage/columns/pax_vec_encoding_column.h" + +namespace pax::traits { + +namespace Impl { + +template +using CreateFunc = std::function; + +template +static T *CreateImpl(uint64 cap) { + auto t = PAX_NEW(cap); + return t; +} + +template +using CreateEncodingFunc = + std::function; + +template +using CreateDecodingFunc = + std::function; + +template +static T *CreateEncodingImpl(uint64 cap, + const PaxEncoder::EncodingOption &encoding_opt) { + auto t = PAX_NEW(cap, encoding_opt); + return t; +} + +template +static T *CreateDecodingImpl(uint64 cap, + const PaxDecoder::DecodingOption &decoding_opt) { + auto t = PAX_NEW(cap, decoding_opt); + return t; +} + +} // namespace Impl + +template