diff --git a/be/src/agent/task_worker_pool.cpp b/be/src/agent/task_worker_pool.cpp index c0f16d304a2b72..a8ab93de455c3b 100644 --- a/be/src/agent/task_worker_pool.cpp +++ b/be/src/agent/task_worker_pool.cpp @@ -1630,11 +1630,13 @@ void drop_tablet_callback(StorageEngine& engine, const TAgentTaskRequest& req) { dropped_tablet->tablet_uid()); LOG_INFO("successfully drop tablet") .tag("signature", req.signature) - .tag("tablet_id", drop_tablet_req.tablet_id); + .tag("tablet_id", drop_tablet_req.tablet_id) + .tag("replica_id", drop_tablet_req.replica_id); } else { LOG_WARNING("failed to drop tablet") .tag("signature", req.signature) .tag("tablet_id", drop_tablet_req.tablet_id) + .tag("replica_id", drop_tablet_req.replica_id) .error(status); } diff --git a/be/src/cloud/cloud_base_compaction.cpp b/be/src/cloud/cloud_base_compaction.cpp index 88d83000e95dfa..9742e57dcf9d34 100644 --- a/be/src/cloud/cloud_base_compaction.cpp +++ b/be/src/cloud/cloud_base_compaction.cpp @@ -125,6 +125,7 @@ Status CloudBaseCompaction::prepare_compact() { _input_row_num += rs->num_rows(); _input_segments += rs->num_segments(); _input_rowsets_data_size += rs->data_disk_size(); + _input_rowsets_index_size += rs->index_disk_size(); _input_rowsets_total_size += rs->total_disk_size(); } LOG_INFO("start CloudBaseCompaction, tablet_id={}, range=[{}-{}]", _tablet->tablet_id(), @@ -320,6 +321,10 @@ Status CloudBaseCompaction::modify_rowsets() { compaction_job->add_output_versions(_output_rowset->end_version()); compaction_job->add_txn_id(_output_rowset->txn_id()); compaction_job->add_output_rowset_ids(_output_rowset->rowset_id().to_string()); + compaction_job->set_index_size_input_rowsets(_input_rowsets_index_size); + compaction_job->set_segment_size_input_rowsets(_input_rowsets_data_size); + compaction_job->set_index_size_output_rowsets(_output_rowset->index_disk_size()); + compaction_job->set_segment_size_output_rowsets(_output_rowset->data_disk_size()); DeleteBitmapPtr output_rowset_delete_bitmap = 
nullptr; if (_tablet->keys_type() == KeysType::UNIQUE_KEYS && diff --git a/be/src/cloud/cloud_cumulative_compaction.cpp b/be/src/cloud/cloud_cumulative_compaction.cpp index 2f08082f51b5f3..f63054563aa18a 100644 --- a/be/src/cloud/cloud_cumulative_compaction.cpp +++ b/be/src/cloud/cloud_cumulative_compaction.cpp @@ -33,6 +33,7 @@ #include "util/uuid_generator.h" namespace doris { +#include "common/compile_check_begin.h" using namespace ErrorCode; bvar::Adder cumu_output_size("cumu_compaction", "output_size"); @@ -263,6 +264,10 @@ Status CloudCumulativeCompaction::modify_rowsets() { compaction_job->add_output_versions(_output_rowset->end_version()); compaction_job->add_txn_id(_output_rowset->txn_id()); compaction_job->add_output_rowset_ids(_output_rowset->rowset_id().to_string()); + compaction_job->set_index_size_input_rowsets(_input_rowsets_index_size); + compaction_job->set_segment_size_input_rowsets(_input_rowsets_data_size); + compaction_job->set_index_size_output_rowsets(_output_rowset->index_disk_size()); + compaction_job->set_segment_size_output_rowsets(_output_rowset->data_disk_size()); DBUG_EXECUTE_IF("CloudCumulativeCompaction::modify_rowsets.enable_spin_wait", { LOG(INFO) << "CloudCumulativeCompaction::modify_rowsets.enable_spin_wait, start"; @@ -371,11 +376,9 @@ Status CloudCumulativeCompaction::modify_rowsets() { Status CloudCumulativeCompaction::process_old_version_delete_bitmap() { // agg previously rowset old version delete bitmap std::vector pre_rowsets {}; - std::vector pre_rowset_ids {}; for (const auto& it : cloud_tablet()->rowset_map()) { if (it.first.second < _input_rowsets.front()->start_version()) { pre_rowsets.emplace_back(it.second); - pre_rowset_ids.emplace_back(it.second->rowset_id().to_string()); } } std::sort(pre_rowsets.begin(), pre_rowsets.end(), Rowset::comparator); @@ -486,8 +489,10 @@ Status CloudCumulativeCompaction::pick_rowsets_to_compact() { } int64_t max_score = config::cumulative_compaction_max_deltas; - auto 
process_memory_usage = doris::GlobalMemoryArbitrator::process_memory_usage(); - bool memory_usage_high = process_memory_usage > MemInfo::soft_mem_limit() * 0.8; + double process_memory_usage = + cast_set(doris::GlobalMemoryArbitrator::process_memory_usage()); + bool memory_usage_high = + process_memory_usage > cast_set(MemInfo::soft_mem_limit()) * 0.8; if (cloud_tablet()->last_compaction_status.is() || memory_usage_high) { max_score = std::max(config::cumulative_compaction_max_deltas / @@ -617,4 +622,5 @@ void CloudCumulativeCompaction::do_lease() { } } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_cumulative_compaction.h b/be/src/cloud/cloud_cumulative_compaction.h index 1159dcb59ceef1..87fc0b62c9c389 100644 --- a/be/src/cloud/cloud_cumulative_compaction.h +++ b/be/src/cloud/cloud_cumulative_compaction.h @@ -24,6 +24,7 @@ #include "olap/compaction.h" namespace doris { +#include "common/compile_check_begin.h" class CloudCumulativeCompaction : public CloudCompactionMixin { public: @@ -60,4 +61,5 @@ class CloudCumulativeCompaction : public CloudCompactionMixin { Version _last_delete_version {-1, -1}; }; +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_cumulative_compaction_policy.cpp b/be/src/cloud/cloud_cumulative_compaction_policy.cpp index 5a9879387b2327..92a47fcc69f8d7 100644 --- a/be/src/cloud/cloud_cumulative_compaction_policy.cpp +++ b/be/src/cloud/cloud_cumulative_compaction_policy.cpp @@ -31,6 +31,7 @@ #include "olap/tablet_meta.h" namespace doris { +#include "common/compile_check_begin.h" CloudSizeBasedCumulativeCompactionPolicy::CloudSizeBasedCumulativeCompactionPolicy( int64_t promotion_size, double promotion_ratio, int64_t promotion_min_size, @@ -48,7 +49,7 @@ int64_t CloudSizeBasedCumulativeCompactionPolicy::_level_size(const int64_t size return (int64_t)1 << (sizeof(size) * 8 - 1 - __builtin_clzl(size)); } -int32_t 
CloudSizeBasedCumulativeCompactionPolicy::pick_input_rowsets( +int64_t CloudSizeBasedCumulativeCompactionPolicy::pick_input_rowsets( CloudTablet* tablet, const std::vector& candidate_rowsets, const int64_t max_compaction_score, const int64_t min_compaction_score, std::vector* input_rowsets, Version* last_delete_version, @@ -114,8 +115,8 @@ int32_t CloudSizeBasedCumulativeCompactionPolicy::pick_input_rowsets( size_t new_compaction_score = *compaction_score; while (rs_begin != input_rowsets->end()) { auto& rs_meta = (*rs_begin)->rowset_meta(); - int current_level = _level_size(rs_meta->total_disk_size()); - int remain_level = _level_size(total_size - rs_meta->total_disk_size()); + int64_t current_level = _level_size(rs_meta->total_disk_size()); + int64_t remain_level = _level_size(total_size - rs_meta->total_disk_size()); // if current level less then remain level, input rowsets contain current rowset // and process return; otherwise, input rowsets do not contain current rowset. if (current_level <= remain_level) { @@ -185,7 +186,7 @@ int32_t CloudSizeBasedCumulativeCompactionPolicy::pick_input_rowsets( } int64_t CloudSizeBasedCumulativeCompactionPolicy::cloud_promotion_size(CloudTablet* t) const { - int64_t promotion_size = int64_t(t->base_size() * _promotion_ratio); + int64_t promotion_size = int64_t(cast_set(t->base_size()) * _promotion_ratio); // promotion_size is between _size_based_promotion_size and _size_based_promotion_min_size return promotion_size > _promotion_size ? _promotion_size : promotion_size < _promotion_min_size ? 
_promotion_min_size @@ -215,7 +216,7 @@ int64_t CloudSizeBasedCumulativeCompactionPolicy::new_cumulative_point( : last_cumulative_point; } -int32_t CloudTimeSeriesCumulativeCompactionPolicy::pick_input_rowsets( +int64_t CloudTimeSeriesCumulativeCompactionPolicy::pick_input_rowsets( CloudTablet* tablet, const std::vector& candidate_rowsets, const int64_t max_compaction_score, const int64_t min_compaction_score, std::vector* input_rowsets, Version* last_delete_version, @@ -377,4 +378,5 @@ int64_t CloudTimeSeriesCumulativeCompactionPolicy::new_cumulative_point( return output_rowset->end_version() + 1; } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_cumulative_compaction_policy.h b/be/src/cloud/cloud_cumulative_compaction_policy.h index c142a8a6d3dffe..9373728547241b 100644 --- a/be/src/cloud/cloud_cumulative_compaction_policy.h +++ b/be/src/cloud/cloud_cumulative_compaction_policy.h @@ -30,6 +30,7 @@ #include "olap/rowset/rowset_meta.h" namespace doris { +#include "common/compile_check_begin.h" class Tablet; struct Version; @@ -44,7 +45,7 @@ class CloudCumulativeCompactionPolicy { virtual int64_t new_compaction_level(const std::vector& input_rowsets) = 0; - virtual int32_t pick_input_rowsets(CloudTablet* tablet, + virtual int64_t pick_input_rowsets(CloudTablet* tablet, const std::vector& candidate_rowsets, const int64_t max_compaction_score, const int64_t min_compaction_score, @@ -71,7 +72,7 @@ class CloudSizeBasedCumulativeCompactionPolicy : public CloudCumulativeCompactio return 0; } - int32_t pick_input_rowsets(CloudTablet* tablet, + int64_t pick_input_rowsets(CloudTablet* tablet, const std::vector& candidate_rowsets, const int64_t max_compaction_score, const int64_t min_compaction_score, @@ -106,7 +107,7 @@ class CloudTimeSeriesCumulativeCompactionPolicy : public CloudCumulativeCompacti int64_t new_compaction_level(const std::vector& input_rowsets) override; - int32_t pick_input_rowsets(CloudTablet* tablet, + int64_t 
pick_input_rowsets(CloudTablet* tablet, const std::vector& candidate_rowsets, const int64_t max_compaction_score, const int64_t min_compaction_score, @@ -115,4 +116,5 @@ class CloudTimeSeriesCumulativeCompactionPolicy : public CloudCumulativeCompacti bool allow_delete = false) override; }; +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_delete_bitmap_action.cpp b/be/src/cloud/cloud_delete_bitmap_action.cpp index 86cc535e1bc88e..3d834bfe7b373c 100644 --- a/be/src/cloud/cloud_delete_bitmap_action.cpp +++ b/be/src/cloud/cloud_delete_bitmap_action.cpp @@ -50,6 +50,7 @@ #include "util/stopwatch.hpp" namespace doris { +#include "common/compile_check_begin.h" using namespace ErrorCode; namespace { @@ -177,4 +178,5 @@ void CloudDeleteBitmapAction::handle(HttpRequest* req) { } } +#include "common/compile_check_end.h" } // namespace doris \ No newline at end of file diff --git a/be/src/cloud/cloud_delete_bitmap_action.h b/be/src/cloud/cloud_delete_bitmap_action.h index 35739a7373efc8..ce507ee9991757 100644 --- a/be/src/cloud/cloud_delete_bitmap_action.h +++ b/be/src/cloud/cloud_delete_bitmap_action.h @@ -27,6 +27,7 @@ #include "olap/tablet.h" namespace doris { +#include "common/compile_check_begin.h" class HttpRequest; class ExecEnv; @@ -52,4 +53,5 @@ class CloudDeleteBitmapAction : public HttpHandlerWithAuth { CloudStorageEngine& _engine; DeleteBitmapActionType _delete_bitmap_action_type; }; +#include "common/compile_check_end.h" } // namespace doris \ No newline at end of file diff --git a/be/src/cloud/cloud_engine_calc_delete_bitmap_task.cpp b/be/src/cloud/cloud_engine_calc_delete_bitmap_task.cpp index 91611d20c6270b..fbf4b9cf303570 100644 --- a/be/src/cloud/cloud_engine_calc_delete_bitmap_task.cpp +++ b/be/src/cloud/cloud_engine_calc_delete_bitmap_task.cpp @@ -34,6 +34,7 @@ #include "runtime/memory/mem_tracker_limiter.h" namespace doris { +#include "common/compile_check_begin.h" 
CloudEngineCalcDeleteBitmapTask::CloudEngineCalcDeleteBitmapTask( CloudStorageEngine& engine, const TCalcDeleteBitmapRequest& cal_delete_bitmap_req, @@ -227,7 +228,7 @@ Status CloudTabletCalcDeleteBitmapTask::handle() const { } } auto total_update_delete_bitmap_time_us = MonotonicMicros() - t3; - LOG(INFO) << "calculate delete bitmap successfully on tablet" + LOG(INFO) << "finish calculate delete bitmap on tablet" << ", table_id=" << tablet->table_id() << ", transaction_id=" << _transaction_id << ", tablet_id=" << tablet->tablet_id() << ", get_tablet_time_us=" << get_tablet_time_us @@ -325,4 +326,5 @@ Status CloudTabletCalcDeleteBitmapTask::_handle_rowset( return status; } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_full_compaction.cpp b/be/src/cloud/cloud_full_compaction.cpp index c27b728c93d29b..bce00c9a2e74f6 100644 --- a/be/src/cloud/cloud_full_compaction.cpp +++ b/be/src/cloud/cloud_full_compaction.cpp @@ -216,6 +216,10 @@ Status CloudFullCompaction::modify_rowsets() { compaction_job->add_output_versions(_output_rowset->end_version()); compaction_job->add_txn_id(_output_rowset->txn_id()); compaction_job->add_output_rowset_ids(_output_rowset->rowset_id().to_string()); + compaction_job->set_index_size_input_rowsets(_input_rowsets_index_size); + compaction_job->set_segment_size_input_rowsets(_input_rowsets_data_size); + compaction_job->set_index_size_output_rowsets(_output_rowset->index_disk_size()); + compaction_job->set_segment_size_output_rowsets(_output_rowset->data_disk_size()); DeleteBitmapPtr output_rowset_delete_bitmap = nullptr; if (_tablet->keys_type() == KeysType::UNIQUE_KEYS && diff --git a/be/src/cloud/cloud_meta_mgr.cpp b/be/src/cloud/cloud_meta_mgr.cpp index 8e21498b0d873d..835e74ca7d5687 100644 --- a/be/src/cloud/cloud_meta_mgr.cpp +++ b/be/src/cloud/cloud_meta_mgr.cpp @@ -64,6 +64,7 @@ #include "util/thrift_rpc_helper.h" namespace doris::cloud { +#include "common/compile_check_begin.h" using 
namespace ErrorCode; Status bthread_fork_join(const std::vector>& tasks, int concurrency) { @@ -717,7 +718,7 @@ Status CloudMetaMgr::sync_tablet_delete_bitmap(CloudTablet* tablet, int64_t old_ "rowset_ids.size={},segment_ids.size={},vers.size={},delete_bitmaps.size={}", rowset_ids.size(), segment_ids.size(), vers.size(), delete_bitmaps.size()); } - for (size_t i = 0; i < rowset_ids.size(); i++) { + for (int i = 0; i < rowset_ids.size(); i++) { RowsetId rst_id; rst_id.init(rowset_ids[i]); delete_bitmap->merge( @@ -757,10 +758,10 @@ Status CloudMetaMgr::prepare_rowset(const RowsetMeta& rs_meta, Status st = retry_rpc("prepare rowset", req, &resp, &MetaService_Stub::prepare_rowset); if (!st.ok() && resp.status().code() == MetaServiceCode::ALREADY_EXISTED) { if (existed_rs_meta != nullptr && resp.has_existed_rowset_meta()) { - RowsetMetaPB doris_rs_meta = + RowsetMetaPB doris_rs_meta_tmp = cloud_rowset_meta_to_doris(std::move(*resp.mutable_existed_rowset_meta())); *existed_rs_meta = std::make_shared(); - (*existed_rs_meta)->init_from_pb(doris_rs_meta); + (*existed_rs_meta)->init_from_pb(doris_rs_meta_tmp); } return Status::AlreadyExist("failed to prepare rowset: {}", resp.status().msg()); } @@ -1286,4 +1287,5 @@ int64_t CloudMetaMgr::get_inverted_index_file_szie(const RowsetMeta& rs_meta) { return total_inverted_index_size; } +#include "common/compile_check_end.h" } // namespace doris::cloud diff --git a/be/src/cloud/cloud_meta_mgr.h b/be/src/cloud/cloud_meta_mgr.h index c49b036ad90c15..913ef59489a1b3 100644 --- a/be/src/cloud/cloud_meta_mgr.h +++ b/be/src/cloud/cloud_meta_mgr.h @@ -27,6 +27,7 @@ #include "util/s3_util.h" namespace doris { +#include "common/compile_check_begin.h" class DeleteBitmap; class StreamLoadContext; @@ -124,4 +125,5 @@ class CloudMetaMgr { }; } // namespace cloud +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_schema_change_job.cpp b/be/src/cloud/cloud_schema_change_job.cpp index 
0bab742c3ad6e5..1cc4d052a81d69 100644 --- a/be/src/cloud/cloud_schema_change_job.cpp +++ b/be/src/cloud/cloud_schema_change_job.cpp @@ -340,17 +340,23 @@ Status CloudSchemaChangeJob::_convert_historical_rowsets(const SchemaChangeParam int64_t num_output_rows = 0; int64_t size_output_rowsets = 0; int64_t num_output_segments = 0; + int64_t index_size_output_rowsets = 0; + int64_t segment_size_output_rowsets = 0; for (auto& rs : _output_rowsets) { sc_job->add_txn_ids(rs->txn_id()); sc_job->add_output_versions(rs->end_version()); num_output_rows += rs->num_rows(); size_output_rowsets += rs->total_disk_size(); num_output_segments += rs->num_segments(); + index_size_output_rowsets += rs->index_disk_size(); + segment_size_output_rowsets += rs->data_disk_size(); } sc_job->set_num_output_rows(num_output_rows); sc_job->set_size_output_rowsets(size_output_rowsets); sc_job->set_num_output_segments(num_output_segments); sc_job->set_num_output_rowsets(_output_rowsets.size()); + sc_job->set_index_size_output_rowsets(index_size_output_rowsets); + sc_job->set_segment_size_output_rowsets(segment_size_output_rowsets); } _output_cumulative_point = std::min(_output_cumulative_point, sc_job->alter_version() + 1); sc_job->set_output_cumulative_point(_output_cumulative_point); diff --git a/be/src/cloud/cloud_storage_engine.cpp b/be/src/cloud/cloud_storage_engine.cpp index dc6abbac31ba1b..b66a9cfbdb2245 100644 --- a/be/src/cloud/cloud_storage_engine.cpp +++ b/be/src/cloud/cloud_storage_engine.cpp @@ -52,6 +52,7 @@ #include "util/parse_util.h" namespace doris { +#include "common/compile_check_begin.h" using namespace std::literals; @@ -166,7 +167,8 @@ Status CloudStorageEngine::open() { _memtable_flush_executor = std::make_unique(); // Use file cache disks number - _memtable_flush_executor->init(io::FileCacheFactory::instance()->get_cache_instance_size()); + _memtable_flush_executor->init( + cast_set(io::FileCacheFactory::instance()->get_cache_instance_size())); _calc_delete_bitmap_executor 
= std::make_unique(); _calc_delete_bitmap_executor->init(); @@ -321,7 +323,7 @@ void CloudStorageEngine::_check_file_cache_ttl_block_valid() { for (const auto& rowset : rowsets) { int64_t ttl_seconds = tablet->tablet_meta()->ttl_seconds(); if (rowset->newest_write_timestamp() + ttl_seconds <= UnixSeconds()) continue; - for (int64_t seg_id = 0; seg_id < rowset->num_segments(); seg_id++) { + for (uint32_t seg_id = 0; seg_id < rowset->num_segments(); seg_id++) { auto hash = Segment::file_cache_key(rowset->rowset_id().to_string(), seg_id); auto* file_cache = io::FileCacheFactory::instance()->get_by_path(hash); file_cache->update_ttl_atime(hash); @@ -350,11 +352,11 @@ void CloudStorageEngine::sync_storage_vault() { for (auto& [id, vault_info, path_format] : vault_infos) { auto fs = get_filesystem(id); - auto st = (fs == nullptr) - ? std::visit(VaultCreateFSVisitor {id, path_format}, vault_info) - : std::visit(RefreshFSVaultVisitor {id, std::move(fs), path_format}, - vault_info); - if (!st.ok()) [[unlikely]] { + auto status = (fs == nullptr) + ? std::visit(VaultCreateFSVisitor {id, path_format}, vault_info) + : std::visit(RefreshFSVaultVisitor {id, std::move(fs), path_format}, + vault_info); + if (!status.ok()) [[unlikely]] { - LOG(WARNING) << vault_process_error(id, vault_info, std::move(st)); + LOG(WARNING) << vault_process_error(id, vault_info, std::move(status)); } } @@ -504,13 +506,13 @@ void CloudStorageEngine::_compaction_tasks_producer_callback() { /// If it is not cleaned up, the reference count of the tablet will always be greater than 1, /// thus cannot be collected by the garbage collector. 
(TabletManager::start_trash_sweep) for (const auto& tablet : tablets_compaction) { - Status st = submit_compaction_task(tablet, compaction_type); - if (st.ok()) continue; - if ((!st.is() && - !st.is()) || + Status status = submit_compaction_task(tablet, compaction_type); + if (status.ok()) continue; + if ((!status.is() && + !status.is()) || VLOG_DEBUG_IS_ON) { LOG(WARNING) << "failed to submit compaction task for tablet: " - << tablet->tablet_id() << ", err: " << st; + << tablet->tablet_id() << ", err: " << status; } } interval = config::generate_compaction_tasks_interval_ms; @@ -544,7 +546,8 @@ std::vector CloudStorageEngine::_generate_cloud_compaction_task int num_cumu = std::accumulate(submitted_cumu_compactions.begin(), submitted_cumu_compactions.end(), 0, [](int a, auto& b) { return a + b.second.size(); }); - int num_base = submitted_base_compactions.size() + submitted_full_compactions.size(); + int num_base = + cast_set(submitted_base_compactions.size() + submitted_full_compactions.size()); int n = thread_per_disk - num_cumu - num_base; if (compaction_type == CompactionType::BASE_COMPACTION) { // We need to reserve at least one thread for cumulative compaction, @@ -822,7 +825,7 @@ Status CloudStorageEngine::get_compaction_status_json(std::string* result) { // cumu std::string_view cumu = "CumulativeCompaction"; rapidjson::Value cumu_key; - cumu_key.SetString(cumu.data(), cumu.length(), root.GetAllocator()); + cumu_key.SetString(cumu.data(), cast_set(cumu.length()), root.GetAllocator()); rapidjson::Document cumu_arr; cumu_arr.SetArray(); for (auto& [tablet_id, v] : _submitted_cumu_compactions) { @@ -834,7 +837,7 @@ Status CloudStorageEngine::get_compaction_status_json(std::string* result) { // base std::string_view base = "BaseCompaction"; rapidjson::Value base_key; - base_key.SetString(base.data(), base.length(), root.GetAllocator()); + base_key.SetString(base.data(), cast_set(base.length()), root.GetAllocator()); rapidjson::Document base_arr; 
base_arr.SetArray(); for (auto& [tablet_id, _] : _submitted_base_compactions) { @@ -857,4 +860,5 @@ std::shared_ptr CloudStorageEngine::cumu_compac return _cumulative_compaction_policies.at(compaction_policy); } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_tablet.cpp b/be/src/cloud/cloud_tablet.cpp index ea86f3b40ff1dc..93c7128756738c 100644 --- a/be/src/cloud/cloud_tablet.cpp +++ b/be/src/cloud/cloud_tablet.cpp @@ -50,6 +50,7 @@ #include "vec/common/schema_util.h" namespace doris { +#include "common/compile_check_begin.h" using namespace ErrorCode; static constexpr int COMPACTION_DELETE_BITMAP_LOCK_ID = -1; @@ -219,6 +220,7 @@ Status CloudTablet::sync_if_not_running() { } TabletSchemaSPtr CloudTablet::merged_tablet_schema() const { + std::shared_lock rlock(_meta_lock); return _merged_tablet_schema; } @@ -380,7 +382,7 @@ void CloudTablet::delete_rowsets(const std::vector& to_delete, _tablet_meta->modify_rs_metas({}, rs_metas, false); } -int CloudTablet::delete_expired_stale_rowsets() { +uint64_t CloudTablet::delete_expired_stale_rowsets() { std::vector expired_rowsets; int64_t expired_stale_sweep_endtime = ::time(nullptr) - config::tablet_rowset_stale_sweep_time_sec; @@ -539,7 +541,7 @@ Result> CloudTablet::create_transient_rowset_write return RowsetFactory::create_rowset_writer(_engine, context, false) .transform([&](auto&& writer) { - writer->set_segment_start_id(rowset.num_segments()); + writer->set_segment_start_id(cast_set(rowset.num_segments())); return writer; }); } @@ -617,7 +619,8 @@ void CloudTablet::get_compaction_status(std::string* json_result) { } rapidjson::Value value; std::string version_str = rowset->get_rowset_info_str(); - value.SetString(version_str.c_str(), version_str.length(), versions_arr.GetAllocator()); + value.SetString(version_str.c_str(), cast_set(version_str.length()), + versions_arr.GetAllocator()); versions_arr.PushBack(value, versions_arr.GetAllocator()); last_version = ver.second; } 
@@ -630,7 +633,7 @@ void CloudTablet::get_compaction_status(std::string* json_result) { for (auto& rowset : stale_rowsets) { rapidjson::Value value; std::string version_str = rowset->get_rowset_info_str(); - value.SetString(version_str.c_str(), version_str.length(), + value.SetString(version_str.c_str(), cast_set(version_str.length()), stale_versions_arr.GetAllocator()); stale_versions_arr.PushBack(value, stale_versions_arr.GetAllocator()); } @@ -775,7 +778,8 @@ Status CloudTablet::calc_delete_bitmap_for_compaction( } std::unique_ptr> location_map; - if (config::enable_rowid_conversion_correctness_check) { + if (config::enable_rowid_conversion_correctness_check && + tablet_schema()->cluster_key_uids().empty()) { location_map = std::make_unique>(); LOG(INFO) << "Location Map inited succ for tablet:" << tablet_id(); } @@ -924,4 +928,5 @@ void CloudTablet::build_tablet_report_info(TTabletInfo* tablet_info) { // but it may be used in the future. } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/cloud/cloud_tablet.h b/be/src/cloud/cloud_tablet.h index 80038e569ba2fc..fc0d64a493d316 100644 --- a/be/src/cloud/cloud_tablet.h +++ b/be/src/cloud/cloud_tablet.h @@ -92,7 +92,7 @@ class CloudTablet final : public BaseTablet { void clear_cache() override; // Return number of deleted stale rowsets - int delete_expired_stale_rowsets(); + uint64_t delete_expired_stale_rowsets(); bool has_stale_rowsets() const { return !_stale_rs_version_map.empty(); } diff --git a/be/src/cloud/config.cpp b/be/src/cloud/config.cpp index e95c295ae1daa5..f90bf536f63018 100644 --- a/be/src/cloud/config.cpp +++ b/be/src/cloud/config.cpp @@ -20,6 +20,7 @@ #include "common/status.h" namespace doris::config { +#include "common/compile_check_begin.h" DEFINE_String(deploy_mode, ""); DEFINE_mString(cloud_unique_id, ""); @@ -76,4 +77,5 @@ DEFINE_mInt32(tablet_txn_info_min_expired_seconds, "120"); DEFINE_mBool(enable_use_cloud_unique_id_from_fe, "true"); 
DEFINE_mBool(enable_cloud_tablet_report, "true"); +#include "common/compile_check_end.h" } // namespace doris::config diff --git a/be/src/cloud/config.h b/be/src/cloud/config.h index b345e6355921a4..a8a7c0c48ec91f 100644 --- a/be/src/cloud/config.h +++ b/be/src/cloud/config.h @@ -20,6 +20,7 @@ #include "common/config.h" namespace doris::config { +#include "common/compile_check_begin.h" DECLARE_String(deploy_mode); // deprecated do not configure directly @@ -110,4 +111,5 @@ DECLARE_mBool(enable_use_cloud_unique_id_from_fe); DECLARE_Bool(enable_cloud_tablet_report); +#include "common/compile_check_end.h" } // namespace doris::config diff --git a/be/src/cloud/pb_convert.cpp b/be/src/cloud/pb_convert.cpp index bff7d8388d30d8..e655ceacf2f08d 100644 --- a/be/src/cloud/pb_convert.cpp +++ b/be/src/cloud/pb_convert.cpp @@ -324,7 +324,7 @@ void doris_tablet_schema_to_cloud(TabletSchemaCloudPB* out, const TabletSchemaPB out->set_store_row_column(in.store_row_column()); out->set_enable_single_replica_compaction(in.enable_single_replica_compaction()); out->set_skip_write_index_on_load(in.skip_write_index_on_load()); - out->mutable_cluster_key_idxes()->CopyFrom(in.cluster_key_idxes()); + out->mutable_cluster_key_uids()->CopyFrom(in.cluster_key_uids()); out->set_is_dynamic_schema(in.is_dynamic_schema()); out->mutable_row_store_column_unique_ids()->CopyFrom(in.row_store_column_unique_ids()); out->set_inverted_index_storage_format(in.inverted_index_storage_format()); @@ -353,7 +353,7 @@ void doris_tablet_schema_to_cloud(TabletSchemaCloudPB* out, TabletSchemaPB&& in) out->set_store_row_column(in.store_row_column()); out->set_enable_single_replica_compaction(in.enable_single_replica_compaction()); out->set_skip_write_index_on_load(in.skip_write_index_on_load()); - out->mutable_cluster_key_idxes()->Swap(in.mutable_cluster_key_idxes()); + out->mutable_cluster_key_uids()->Swap(in.mutable_cluster_key_uids()); out->set_is_dynamic_schema(in.is_dynamic_schema()); 
out->mutable_row_store_column_unique_ids()->Swap(in.mutable_row_store_column_unique_ids()); out->set_inverted_index_storage_format(in.inverted_index_storage_format()); @@ -395,7 +395,7 @@ void cloud_tablet_schema_to_doris(TabletSchemaPB* out, const TabletSchemaCloudPB out->set_store_row_column(in.store_row_column()); out->set_enable_single_replica_compaction(in.enable_single_replica_compaction()); out->set_skip_write_index_on_load(in.skip_write_index_on_load()); - out->mutable_cluster_key_idxes()->CopyFrom(in.cluster_key_idxes()); + out->mutable_cluster_key_uids()->CopyFrom(in.cluster_key_uids()); out->set_is_dynamic_schema(in.is_dynamic_schema()); out->mutable_row_store_column_unique_ids()->CopyFrom(in.row_store_column_unique_ids()); out->set_inverted_index_storage_format(in.inverted_index_storage_format()); @@ -425,7 +425,7 @@ void cloud_tablet_schema_to_doris(TabletSchemaPB* out, TabletSchemaCloudPB&& in) out->set_store_row_column(in.store_row_column()); out->set_enable_single_replica_compaction(in.enable_single_replica_compaction()); out->set_skip_write_index_on_load(in.skip_write_index_on_load()); - out->mutable_cluster_key_idxes()->Swap(in.mutable_cluster_key_idxes()); + out->mutable_cluster_key_uids()->Swap(in.mutable_cluster_key_uids()); out->set_is_dynamic_schema(in.is_dynamic_schema()); out->mutable_row_store_column_unique_ids()->Swap(in.mutable_row_store_column_unique_ids()); out->set_inverted_index_storage_format(in.inverted_index_storage_format()); diff --git a/be/src/clucene b/be/src/clucene index 48fa9cc4ec32b4..a506dbb6c523aa 160000 --- a/be/src/clucene +++ b/be/src/clucene @@ -1 +1 @@ -Subproject commit 48fa9cc4ec32b40bf3b02338d0a1b2cdbc6408cf +Subproject commit a506dbb6c523aa65044eb1c527a066d236172543 diff --git a/be/src/common/compile_check_begin.h b/be/src/common/compile_check_begin.h index 6da403f2894885..4d860d39d1cf72 100644 --- a/be/src/common/compile_check_begin.h +++ b/be/src/common/compile_check_begin.h @@ -23,8 +23,9 @@ #ifdef __clang__ 
#pragma clang diagnostic push #pragma clang diagnostic error "-Wconversion" +#pragma clang diagnostic error "-Wshadow" #pragma clang diagnostic ignored "-Wsign-conversion" #pragma clang diagnostic ignored "-Wfloat-conversion" #endif -//#include "common/compile_check_begin.h" \ No newline at end of file +//#include "common/compile_check_begin.h" diff --git a/be/src/common/compile_check_end.h b/be/src/common/compile_check_end.h index 0897965dc74a3d..40df41b6bdfc6c 100644 --- a/be/src/common/compile_check_end.h +++ b/be/src/common/compile_check_end.h @@ -20,4 +20,4 @@ #endif #undef COMPILE_CHECK -// #include "common/compile_check_end.h" \ No newline at end of file +// #include "common/compile_check_end.h" diff --git a/be/src/common/config.cpp b/be/src/common/config.cpp index 63989a76261bb6..b3e7d0bce5ee4d 100644 --- a/be/src/common/config.cpp +++ b/be/src/common/config.cpp @@ -1166,6 +1166,9 @@ DEFINE_mBool(enable_missing_rows_correctness_check, "false"); // When the number of missing versions is more than this value, do not directly // retry the publish and handle it through async publish. DEFINE_mInt32(mow_publish_max_discontinuous_version_num, "20"); +// When the size of primary keys in memory exceeds this value, finish current segment +// and create a new segment, used in compaction. Default 50MB. +DEFINE_mInt64(mow_primary_key_index_max_size_in_memory, "52428800"); // When the version is not continuous for MOW table in publish phase and the gap between // current txn's publishing version and the max version of the tablet exceeds this value, // don't print warning log diff --git a/be/src/common/config.h b/be/src/common/config.h index 29e55e6406390e..59fc61e8cb3e5a 100644 --- a/be/src/common/config.h +++ b/be/src/common/config.h @@ -1236,6 +1236,9 @@ DECLARE_mBool(enable_missing_rows_correctness_check); // When the number of missing versions is more than this value, do not directly // retry the publish and handle it through async publish. 
DECLARE_mInt32(mow_publish_max_discontinuous_version_num); +// When the size of primary keys in memory exceeds this value, finish current segment +// and create a new segment, used in compaction. +DECLARE_mInt64(mow_primary_key_index_max_size_in_memory); // When the version is not continuous for MOW table in publish phase and the gap between // current txn's publishing version and the max version of the tablet exceeds this value, // don't print warning log diff --git a/be/src/common/daemon.cpp b/be/src/common/daemon.cpp index ce2a6878dba034..d3d55f10dde5fb 100644 --- a/be/src/common/daemon.cpp +++ b/be/src/common/daemon.cpp @@ -500,15 +500,18 @@ void Daemon::cache_adjust_capacity_thread() { void Daemon::cache_prune_stale_thread() { int32_t interval = config::cache_periodic_prune_stale_sweep_sec; while (!_stop_background_threads_latch.wait_for(std::chrono::seconds(interval))) { - if (interval <= 0) { - LOG(WARNING) << "config of cache clean interval is illegal: [" << interval - << "], force set to 3600 "; - interval = 3600; + if (config::cache_periodic_prune_stale_sweep_sec <= 0) { + LOG(WARNING) << "config of cache clean interval is: [" << interval + << "], it means the cache prune stale thread is disabled, will wait 3s " + "and check again."; + interval = 3; + continue; } if (config::disable_memory_gc) { continue; } CacheManager::instance()->for_each_cache_prune_stale(); + interval = config::cache_periodic_prune_stale_sweep_sec; } } diff --git a/be/src/exec/schema_scanner.cpp b/be/src/exec/schema_scanner.cpp index 39dd45163322ac..4b430f04289d04 100644 --- a/be/src/exec/schema_scanner.cpp +++ b/be/src/exec/schema_scanner.cpp @@ -124,7 +124,6 @@ Status SchemaScanner::get_next_block_async(RuntimeState* state) { } SCOPED_ATTACH_TASK(state); _async_thread_running = true; - _finish_dependency->block(); if (!_opened) { _data_block = vectorized::Block::create_unique(); _init_block(_data_block.get()); @@ -140,9 +139,6 @@ Status 
SchemaScanner::get_next_block_async(RuntimeState* state) { _eos = eos; _async_thread_running = false; _dependency->set_ready(); - if (eos) { - _finish_dependency->set_ready(); - } })); return Status::OK(); } diff --git a/be/src/exec/schema_scanner.h b/be/src/exec/schema_scanner.h index 440912bff1d729..6e7a229b7fd7b9 100644 --- a/be/src/exec/schema_scanner.h +++ b/be/src/exec/schema_scanner.h @@ -106,11 +106,7 @@ class SchemaScanner { // factory function static std::unique_ptr create(TSchemaTableType::type type); TSchemaTableType::type type() const { return _schema_table_type; } - void set_dependency(std::shared_ptr dep, - std::shared_ptr fin_dep) { - _dependency = dep; - _finish_dependency = fin_dep; - } + void set_dependency(std::shared_ptr dep) { _dependency = dep; } Status get_next_block_async(RuntimeState* state); protected: @@ -139,7 +135,6 @@ class SchemaScanner { RuntimeProfile::Counter* _fill_block_timer = nullptr; std::shared_ptr _dependency = nullptr; - std::shared_ptr _finish_dependency = nullptr; std::unique_ptr _data_block; AtomicStatus _scanner_status; diff --git a/be/src/exec/schema_scanner/schema_columns_scanner.cpp b/be/src/exec/schema_scanner/schema_columns_scanner.cpp index 8325a7f5dc4f2d..b60dfc3d203f89 100644 --- a/be/src/exec/schema_scanner/schema_columns_scanner.cpp +++ b/be/src/exec/schema_scanner/schema_columns_scanner.cpp @@ -450,7 +450,19 @@ Status SchemaColumnsScanner::_fill_block_impl(vectorized::Block* block) { RETURN_IF_ERROR(fill_dest_column_for_range(block, 4, datas)); } // COLUMN_DEFAULT - { RETURN_IF_ERROR(fill_dest_column_for_range(block, 5, null_datas)); } + { + std::vector strs(columns_num); + for (int i = 0; i < columns_num; ++i) { + if (_desc_result.columns[i].columnDesc.__isset.defaultValue) { + strs[i] = StringRef(_desc_result.columns[i].columnDesc.defaultValue.c_str(), + _desc_result.columns[i].columnDesc.defaultValue.length()); + datas[i] = strs.data() + i; + } else { + datas[i] = nullptr; + } + } + 
RETURN_IF_ERROR(fill_dest_column_for_range(block, 5, datas)); + } // IS_NULLABLE { StringRef str_yes = StringRef("YES", 3); diff --git a/be/src/exec/schema_scanner/schema_tables_scanner.cpp b/be/src/exec/schema_scanner/schema_tables_scanner.cpp index 23710b81971c15..3aba0dfcc4f83c 100644 --- a/be/src/exec/schema_scanner/schema_tables_scanner.cpp +++ b/be/src/exec/schema_scanner/schema_tables_scanner.cpp @@ -236,7 +236,7 @@ Status SchemaTablesScanner::_fill_block_impl(vectorized::Block* block) { std::vector srcs(table_num); for (int i = 0; i < table_num; ++i) { const TTableStatus& tbl_status = _table_result.tables[i]; - if (tbl_status.__isset.avg_row_length) { + if (tbl_status.__isset.data_length) { srcs[i] = tbl_status.data_length; datas[i] = srcs.data() + i; } else { @@ -248,7 +248,19 @@ Status SchemaTablesScanner::_fill_block_impl(vectorized::Block* block) { // max_data_length { RETURN_IF_ERROR(fill_dest_column_for_range(block, 10, null_datas)); } // index_length - { RETURN_IF_ERROR(fill_dest_column_for_range(block, 11, null_datas)); } + { + std::vector srcs(table_num); + for (int i = 0; i < table_num; ++i) { + const TTableStatus& tbl_status = _table_result.tables[i]; + if (tbl_status.__isset.index_length) { + srcs[i] = tbl_status.index_length; + datas[i] = srcs.data() + i; + } else { + datas[i] = nullptr; + } + } + RETURN_IF_ERROR(fill_dest_column_for_range(block, 11, datas)); + } // data_free { RETURN_IF_ERROR(fill_dest_column_for_range(block, 12, null_datas)); } // auto_increment diff --git a/be/src/exprs/bloom_filter_func.h b/be/src/exprs/bloom_filter_func.h index ff749420ad286e..4d221f7bfe8421 100644 --- a/be/src/exprs/bloom_filter_func.h +++ b/be/src/exprs/bloom_filter_func.h @@ -26,17 +26,41 @@ #include "vec/common/string_ref.h" namespace doris { +// There are problems with the implementation of the old datetimev2. For compatibility reasons, we will keep this code temporarily.
+struct fixed_len_to_uint32 { + template + uint32_t operator()(T value) { + if constexpr (sizeof(T) <= sizeof(uint32_t)) { + if constexpr (std::is_same_v>) { + return (uint32_t)value.to_int64(); + } else { + return (uint32_t)value; + } + } + return std::hash()(value); + } +}; + +struct fixed_len_to_uint32_v2 { + template + uint32_t operator()(T value) { + if constexpr (sizeof(T) <= sizeof(uint32_t)) { + if constexpr (std::is_same_v>) { + return (uint32_t)value.to_date_int_val(); + } else { + return (uint32_t)value; + } + } + return std::hash()(value); + } +}; class BloomFilterAdaptor { public: - BloomFilterAdaptor(bool null_aware = false) : _null_aware(null_aware) { + BloomFilterAdaptor(bool null_aware) : _null_aware(null_aware) { _bloom_filter = std::make_shared(); } - static int64_t optimal_bit_num(int64_t expect_num, double fpp) { - return doris::segment_v2::BloomFilter::optimal_bit_num(expect_num, fpp) / 8; - } - static BloomFilterAdaptor* create(bool null_aware) { return new BloomFilterAdaptor(null_aware); } @@ -57,27 +81,23 @@ class BloomFilterAdaptor { size_t size() { return _bloom_filter->directory().size; } - template - bool test(T data) const { - return _bloom_filter->find(data); - } + bool test(uint32_t data) const { return _bloom_filter->find(data); } - // test_element/find_element only used on vectorized engine - template + template bool test_element(T element) const { if constexpr (std::is_same_v) { return _bloom_filter->find(element); } else { - return _bloom_filter->find(HashUtil::fixed_len_to_uint32(element)); + return _bloom_filter->find(fixed_len_to_uint32_method()(element)); } } - template + template void add_element(T element) { if constexpr (std::is_same_v) { _bloom_filter->insert(element); } else { - _bloom_filter->insert(HashUtil::fixed_len_to_uint32(element)); + _bloom_filter->insert(fixed_len_to_uint32_method()(element)); } } @@ -214,6 +234,8 @@ class BloomFilterFuncBase : public RuntimeFilterFuncBase { void 
set_contain_null_and_null_aware() { _bloom_filter->set_contain_null_and_null_aware(); } + void set_enable_fixed_len_to_uint32_v2() { _enable_fixed_len_to_uint32_v2 = true; } + size_t get_size() const { return _bloom_filter ? _bloom_filter->size() : 0; } void light_copy(BloomFilterFuncBase* bloomfilter_func) { @@ -221,6 +243,7 @@ class BloomFilterFuncBase : public RuntimeFilterFuncBase { _bloom_filter_alloced = other_func->_bloom_filter_alloced; _bloom_filter = other_func->_bloom_filter; _inited = other_func->_inited; + _enable_fixed_len_to_uint32_v2 |= other_func->_enable_fixed_len_to_uint32_v2; } virtual void insert(const void* data) = 0; @@ -255,9 +278,10 @@ class BloomFilterFuncBase : public RuntimeFilterFuncBase { int64_t _runtime_bloom_filter_max_size; bool _build_bf_exactly = false; bool _bloom_filter_size_calculated_by_ndv = false; + bool _enable_fixed_len_to_uint32_v2 = false; }; -template +template uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* data, const uint8* nullmap, uint16_t* offsets, int number, const bool is_parse_column) { @@ -281,7 +305,8 @@ uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* dat if (nullmap == nullptr) { for (int i = 0; i < number; i++) { uint16_t idx = offsets[i]; - if (!bloom_filter.test_element(get_element(data, idx))) { + if (!bloom_filter.test_element( + get_element(data, idx))) { continue; } offsets[new_size++] = idx; @@ -294,7 +319,8 @@ uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* dat continue; } } else { - if (!bloom_filter.test_element(get_element(data, idx))) { + if (!bloom_filter.test_element( + get_element(data, idx))) { continue; } } @@ -304,7 +330,7 @@ uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* dat } else { if (nullmap == nullptr) { for (int i = 0; i < number; i++) { - if (!bloom_filter.test_element(get_element(data, i))) { + if (!bloom_filter.test_element(get_element(data, i))) { continue; } 
offsets[new_size++] = i; @@ -316,7 +342,8 @@ uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* dat continue; } } else { - if (!bloom_filter.test_element(get_element(data, i))) { + if (!bloom_filter.test_element( + get_element(data, i))) { continue; } } @@ -327,16 +354,17 @@ uint16_t find_batch_olap(const BloomFilterAdaptor& bloom_filter, const char* dat return new_size; } -template +template struct CommonFindOp { - uint16_t find_batch_olap_engine(const BloomFilterAdaptor& bloom_filter, const char* data, - const uint8* nullmap, uint16_t* offsets, int number, - const bool is_parse_column) { - return find_batch_olap(bloom_filter, data, nullmap, offsets, number, is_parse_column); + static uint16_t find_batch_olap_engine(const BloomFilterAdaptor& bloom_filter, const char* data, + const uint8* nullmap, uint16_t* offsets, int number, + const bool is_parse_column) { + return find_batch_olap(bloom_filter, data, nullmap, offsets, + number, is_parse_column); } - void insert_batch(BloomFilterAdaptor& bloom_filter, const vectorized::ColumnPtr& column, - size_t start) const { + static void insert_batch(BloomFilterAdaptor& bloom_filter, const vectorized::ColumnPtr& column, + size_t start) { const auto size = column->size(); if (column->is_nullable()) { const auto* nullable = assert_cast(column.get()); @@ -348,7 +376,7 @@ struct CommonFindOp { const T* data = (T*)col.get_raw_data().data; for (size_t i = start; i < size; i++) { if (!nullmap[i]) { - bloom_filter.add_element(*(data + i)); + bloom_filter.add_element(*(data + i)); } else { bloom_filter.set_contain_null(); } @@ -356,13 +384,13 @@ struct CommonFindOp { } else { const T* data = (T*)column->get_raw_data().data; for (size_t i = start; i < size; i++) { - bloom_filter.add_element(*(data + i)); + bloom_filter.add_element(*(data + i)); } } } - void find_batch(const BloomFilterAdaptor& bloom_filter, const vectorized::ColumnPtr& column, - uint8_t* results) const { + static void find_batch(const 
BloomFilterAdaptor& bloom_filter, + const vectorized::ColumnPtr& column, uint8_t* results) { const T* __restrict data = nullptr; const uint8_t* __restrict nullmap = nullptr; if (column->is_nullable()) { @@ -382,31 +410,32 @@ struct CommonFindOp { if (nullmap) { for (size_t i = 0; i < size; i++) { if (!nullmap[i]) { - results[i] = bloom_filter.test_element(data[i]); + results[i] = bloom_filter.test_element(data[i]); } else { results[i] = bloom_filter.contain_null(); } } } else { for (size_t i = 0; i < size; i++) { - results[i] = bloom_filter.test_element(data[i]); + results[i] = bloom_filter.test_element(data[i]); } } } - void insert(BloomFilterAdaptor& bloom_filter, const void* data) const { - bloom_filter.add_element(*(T*)data); + static void insert(BloomFilterAdaptor& bloom_filter, const void* data) { + bloom_filter.add_element(*(T*)data); } }; -struct StringFindOp : CommonFindOp { +template +struct StringFindOp : CommonFindOp { static void insert_batch(BloomFilterAdaptor& bloom_filter, const vectorized::ColumnPtr& column, size_t start) { auto _insert_batch_col_str = [&](const auto& col, const uint8_t* __restrict nullmap, size_t start, size_t size) { for (size_t i = start; i < size; i++) { if (nullmap == nullptr || !nullmap[i]) { - bloom_filter.add_element(col.get_data_at(i)); + bloom_filter.add_element(col.get_data_at(i)); } else { bloom_filter.set_contain_null(); } @@ -451,20 +480,23 @@ struct StringFindOp : CommonFindOp { if (nullable->has_null()) { for (size_t i = 0; i < col.size(); i++) { if (!nullmap[i]) { - results[i] = bloom_filter.test_element(col.get_data_at(i)); + results[i] = bloom_filter.test_element( + col.get_data_at(i)); } else { results[i] = bloom_filter.contain_null(); } } } else { for (size_t i = 0; i < col.size(); i++) { - results[i] = bloom_filter.test_element(col.get_data_at(i)); + results[i] = bloom_filter.test_element( + col.get_data_at(i)); } } } else { const auto& col = assert_cast(column.get()); for (size_t i = 0; i < col->size(); i++) 
{ - results[i] = bloom_filter.test_element(col->get_data_at(i)); + results[i] = + bloom_filter.test_element(col->get_data_at(i)); } } } @@ -472,34 +504,35 @@ struct StringFindOp : CommonFindOp { // We do not need to judge whether data is empty, because null will not appear // when filer used by the storage engine -struct FixedStringFindOp : public StringFindOp { +template +struct FixedStringFindOp : public StringFindOp { static uint16_t find_batch_olap_engine(const BloomFilterAdaptor& bloom_filter, const char* data, const uint8* nullmap, uint16_t* offsets, int number, const bool is_parse_column) { - return find_batch_olap(bloom_filter, data, nullmap, offsets, number, - is_parse_column); + return find_batch_olap( + bloom_filter, data, nullmap, offsets, number, is_parse_column); } }; -template +template struct BloomFilterTypeTraits { using T = typename PrimitiveTypeTraits::CppType; - using FindOp = CommonFindOp; + using FindOp = CommonFindOp; }; -template <> -struct BloomFilterTypeTraits { - using FindOp = FixedStringFindOp; +template +struct BloomFilterTypeTraits { + using FindOp = FixedStringFindOp; }; -template <> -struct BloomFilterTypeTraits { - using FindOp = StringFindOp; +template +struct BloomFilterTypeTraits { + using FindOp = StringFindOp; }; -template <> -struct BloomFilterTypeTraits { - using FindOp = StringFindOp; +template +struct BloomFilterTypeTraits { + using FindOp = StringFindOp; }; template @@ -511,16 +544,28 @@ class BloomFilterFunc final : public BloomFilterFuncBase { void insert(const void* data) override { DCHECK(_bloom_filter != nullptr); - dummy.insert(*_bloom_filter, data); + if (_enable_fixed_len_to_uint32_v2) { + OpV2::insert(*_bloom_filter, data); + } else { + Op::insert(*_bloom_filter, data); + } } void insert_fixed_len(const vectorized::ColumnPtr& column, size_t start) override { DCHECK(_bloom_filter != nullptr); - dummy.insert_batch(*_bloom_filter, column, start); + if (_enable_fixed_len_to_uint32_v2) { + 
OpV2::insert_batch(*_bloom_filter, column, start); + } else { + Op::insert_batch(*_bloom_filter, column, start); + } } void find_fixed_len(const vectorized::ColumnPtr& column, uint8_t* results) override { - dummy.find_batch(*_bloom_filter, column, results); + if (_enable_fixed_len_to_uint32_v2) { + OpV2::find_batch(*_bloom_filter, column, results); + } else { + Op::find_batch(*_bloom_filter, column, results); + } } template @@ -542,12 +587,18 @@ class BloomFilterFunc final : public BloomFilterFuncBase { uint16_t find_fixed_len_olap_engine(const char* data, const uint8* nullmap, uint16_t* offsets, int number, bool is_parse_column) override { - return dummy.find_batch_olap_engine(*_bloom_filter, data, nullmap, offsets, number, - is_parse_column); + if (_enable_fixed_len_to_uint32_v2) { + return OpV2::find_batch_olap_engine(*_bloom_filter, data, nullmap, offsets, number, + is_parse_column); + } else { + return Op::find_batch_olap_engine(*_bloom_filter, data, nullmap, offsets, number, + is_parse_column); + } } private: - typename BloomFilterTypeTraits::FindOp dummy; + using Op = typename BloomFilterTypeTraits::FindOp; + using OpV2 = typename BloomFilterTypeTraits::FindOp; }; } // namespace doris diff --git a/be/src/exprs/create_predicate_function.h b/be/src/exprs/create_predicate_function.h index 44f39fb77f6d85..57a8b6376a9fed 100644 --- a/be/src/exprs/create_predicate_function.h +++ b/be/src/exprs/create_predicate_function.h @@ -232,7 +232,7 @@ inline auto create_bitmap_filter(PrimitiveType type) { template ColumnPredicate* create_olap_column_predicate(uint32_t column_id, const std::shared_ptr& filter, - int be_exec_version, const TabletColumn*) { + const TabletColumn*) { std::shared_ptr filter_olap; filter_olap.reset(create_bloom_filter(PT)); filter_olap->light_copy(filter.get()); @@ -243,10 +243,10 @@ ColumnPredicate* create_olap_column_predicate(uint32_t column_id, template ColumnPredicate* create_olap_column_predicate(uint32_t column_id, const std::shared_ptr& 
filter, - int be_exec_version, const TabletColumn*) { + const TabletColumn*) { if constexpr (PT == TYPE_TINYINT || PT == TYPE_SMALLINT || PT == TYPE_INT || PT == TYPE_BIGINT) { - return new BitmapFilterColumnPredicate(column_id, filter, be_exec_version); + return new BitmapFilterColumnPredicate(column_id, filter); } else { throw Exception(ErrorCode::INTERNAL_ERROR, "bitmap filter do not support type {}", PT); } @@ -254,7 +254,7 @@ ColumnPredicate* create_olap_column_predicate(uint32_t column_id, template ColumnPredicate* create_olap_column_predicate(uint32_t column_id, - const std::shared_ptr& filter, int, + const std::shared_ptr& filter, const TabletColumn* column = nullptr) { return create_in_list_predicate(column_id, filter, column->length()); @@ -262,7 +262,7 @@ ColumnPredicate* create_olap_column_predicate(uint32_t column_id, template ColumnPredicate* create_olap_column_predicate(uint32_t column_id, - const std::shared_ptr& filter, int, + const std::shared_ptr& filter, const TabletColumn* column = nullptr) { // currently only support like predicate if constexpr (PT == TYPE_CHAR) { @@ -277,22 +277,19 @@ ColumnPredicate* create_olap_column_predicate(uint32_t column_id, template ColumnPredicate* create_column_predicate(uint32_t column_id, const std::shared_ptr& filter, - FieldType type, int be_exec_version, - const TabletColumn* column = nullptr) { + FieldType type, const TabletColumn* column = nullptr) { switch (type) { -#define M(NAME) \ - case FieldType::OLAP_FIELD_##NAME: { \ - return create_olap_column_predicate(column_id, filter, be_exec_version, column); \ +#define M(NAME) \ + case FieldType::OLAP_FIELD_##NAME: { \ + return create_olap_column_predicate(column_id, filter, column); \ } APPLY_FOR_PRIMTYPE(M) #undef M case FieldType::OLAP_FIELD_TYPE_DECIMAL: { - return create_olap_column_predicate(column_id, filter, be_exec_version, - column); + return create_olap_column_predicate(column_id, filter, column); } case FieldType::OLAP_FIELD_TYPE_BOOL: { - return 
create_olap_column_predicate(column_id, filter, be_exec_version, - column); + return create_olap_column_predicate(column_id, filter, column); } default: return nullptr; diff --git a/be/src/exprs/runtime_filter.cpp b/be/src/exprs/runtime_filter.cpp index c983af0fb3ea71..8f297d7074ff12 100644 --- a/be/src/exprs/runtime_filter.cpp +++ b/be/src/exprs/runtime_filter.cpp @@ -740,6 +740,12 @@ class RuntimePredicateWrapper { return Status::OK(); } + void set_enable_fixed_len_to_uint32_v2() { + if (is_bloomfilter()) { + _context->bloom_filter_func->set_enable_fixed_len_to_uint32_v2(); + } + } + // used by shuffle runtime filter // assign this filter by protobuf Status assign(const PBloomFilter* bloom_filter, butil::IOBufAsZeroCopyInputStream* data, @@ -975,11 +981,10 @@ class RuntimePredicateWrapper { Status IRuntimeFilter::create(RuntimeFilterParamsContext* state, const TRuntimeFilterDesc* desc, const TQueryOptions* query_options, const RuntimeFilterRole role, - int node_id, std::shared_ptr* res, - bool build_bf_exactly) { + int node_id, std::shared_ptr* res) { *res = std::make_shared(state, desc); (*res)->set_role(role); - return (*res)->init_with_desc(desc, query_options, node_id, build_bf_exactly); + return (*res)->init_with_desc(desc, query_options, node_id); } RuntimeFilterContextSPtr& IRuntimeFilter::get_shared_context_ref() { @@ -1348,7 +1353,7 @@ std::string IRuntimeFilter::formatted_state() const { } Status IRuntimeFilter::init_with_desc(const TRuntimeFilterDesc* desc, const TQueryOptions* options, - int node_id, bool build_bf_exactly) { + int node_id) { // if node_id == -1 , it shouldn't be a consumer DCHECK(node_id >= 0 || (node_id == -1 && !is_consumer())); @@ -1358,6 +1363,8 @@ Status IRuntimeFilter::init_with_desc(const TRuntimeFilterDesc* desc, const TQue _expr_order = desc->expr_order; vectorized::VExprContextSPtr build_ctx; RETURN_IF_ERROR(vectorized::VExpr::create_expr_tree(desc->src_expr, build_ctx)); + _enable_fixed_len_to_uint32_v2 = 
options->__isset.enable_fixed_len_to_uint32_v2 && + options->enable_fixed_len_to_uint32_v2; RuntimeFilterParams params; params.filter_id = _filter_id; @@ -1370,21 +1377,10 @@ Status IRuntimeFilter::init_with_desc(const TRuntimeFilterDesc* desc, const TQue params.runtime_bloom_filter_max_size = options->__isset.runtime_bloom_filter_max_size ? options->runtime_bloom_filter_max_size : 0; - auto sync_filter_size = desc->__isset.sync_filter_size && desc->sync_filter_size; - // We build runtime filter by exact distinct count if all of 3 conditions are met: - // 1. Only 1 join key - // 2. Bloom filter - // 3. Size of all bloom filters will be same (size will be sync or this is a broadcast join). - params.build_bf_exactly = - build_bf_exactly && (_runtime_filter_type == RuntimeFilterType::BLOOM_FILTER || - _runtime_filter_type == RuntimeFilterType::IN_OR_BLOOM_FILTER); + params.build_bf_exactly = desc->__isset.build_bf_exactly && desc->build_bf_exactly; params.bloom_filter_size_calculated_by_ndv = desc->bloom_filter_size_calculated_by_ndv; - if (!sync_filter_size) { - params.build_bf_exactly &= !_is_broadcast_join; - } - if (desc->__isset.bloom_filter_size_bytes) { params.bloom_filter_size = desc->bloom_filter_size_bytes; } @@ -1419,7 +1415,11 @@ Status IRuntimeFilter::init_with_desc(const TRuntimeFilterDesc* desc, const TQue } _wrapper = std::make_shared(¶ms); - return _wrapper->init(¶ms); + RETURN_IF_ERROR(_wrapper->init(¶ms)); + if (_enable_fixed_len_to_uint32_v2) { + _wrapper->set_enable_fixed_len_to_uint32_v2(); + } + return Status::OK(); } Status IRuntimeFilter::serialize(PMergeFilterRequest* request, void** data, int* len) { @@ -1544,7 +1544,7 @@ std::string IRuntimeFilter::debug_string() const { return fmt::format( "RuntimeFilter: (id = {}, type = {}, is_broadcast: {}, ignored: {}, " "build_bf_cardinality: {}, dependency: {}, synced_size: {}, has_local_target: {}, " - "has_remote_target: {},error_msg: [{}]", + "has_remote_target: {}, error_msg: [{}]", _filter_id, 
to_string(_runtime_filter_type), _is_broadcast_join, _wrapper->_context->ignored, _wrapper->get_build_bf_cardinality(), _dependency ? _dependency->debug_string() : "none", _synced_size, _has_local_target, @@ -1616,6 +1616,9 @@ void IRuntimeFilter::update_filter(std::shared_ptr wrap wrapper->_column_return_type = _wrapper->_column_return_type; } _wrapper = wrapper; + if (_enable_fixed_len_to_uint32_v2) { + _wrapper->set_enable_fixed_len_to_uint32_v2(); + } update_runtime_filter_type_to_profile(local_merge_time); signal(); } diff --git a/be/src/exprs/runtime_filter.h b/be/src/exprs/runtime_filter.h index a1fdfbf07d239d..b0e82a75335cc5 100644 --- a/be/src/exprs/runtime_filter.h +++ b/be/src/exprs/runtime_filter.h @@ -213,8 +213,7 @@ class IRuntimeFilter { static Status create(RuntimeFilterParamsContext* state, const TRuntimeFilterDesc* desc, const TQueryOptions* query_options, const RuntimeFilterRole role, - int node_id, std::shared_ptr* res, - bool build_bf_exactly = false); + int node_id, std::shared_ptr* res); RuntimeFilterContextSPtr& get_shared_context_ref(); @@ -260,7 +259,7 @@ class IRuntimeFilter { // init filter with desc Status init_with_desc(const TRuntimeFilterDesc* desc, const TQueryOptions* options, - int node_id = -1, bool build_bf_exactly = false); + int node_id = -1); // serialize _wrapper to protobuf Status serialize(PMergeFilterRequest* request, void** data, int* len); @@ -355,8 +354,9 @@ class IRuntimeFilter { const std::shared_ptr& dependency); int64_t get_synced_size() const { - if (_synced_size == -1) { - throw Status::InternalError("sync filter size meet error, filter: {}", debug_string()); + if (_synced_size == -1 || !_dependency) { + throw Exception(doris::ErrorCode::INTERNAL_ERROR, + "sync filter size meet error, filter: {}", debug_string()); } return _synced_size; } @@ -424,6 +424,8 @@ class IRuntimeFilter { int64_t _synced_size = -1; std::shared_ptr _dependency; + + bool _enable_fixed_len_to_uint32_v2 = false; }; // avoid expose 
RuntimePredicateWrapper diff --git a/be/src/http/http_handler_with_auth.cpp b/be/src/http/http_handler_with_auth.cpp index 518b9868de191e..ae5c024e76d093 100644 --- a/be/src/http/http_handler_with_auth.cpp +++ b/be/src/http/http_handler_with_auth.cpp @@ -35,6 +35,7 @@ HttpHandlerWithAuth::HttpHandlerWithAuth(ExecEnv* exec_env, TPrivilegeHier::type : _exec_env(exec_env), _hier(hier), _type(type) {} int HttpHandlerWithAuth::on_header(HttpRequest* req) { + // If the return value isn't 0, you must call `send_reply` first, to avoid leaving the request link without a response. TCheckAuthRequest auth_request; TCheckAuthResult auth_result; AuthInfo auth_info; @@ -83,6 +84,11 @@ int HttpHandlerWithAuth::on_header(HttpRequest* req) { #ifndef BE_TEST TNetworkAddress master_addr = _exec_env->cluster_info()->master_fe_addr; + if (master_addr.hostname.empty() || master_addr.port == 0) { + LOG(WARNING) << "Not found master fe, Can't auth API request: " << req->debug_string(); + HttpChannel::send_error(req, HttpStatus::SERVICE_UNAVAILABLE); + return -1; + } { auto status = ThriftRpcHelper::rpc( master_addr.hostname, master_addr.port, @@ -90,6 +96,10 @@ int HttpHandlerWithAuth::on_header(HttpRequest* req) { client->checkAuth(auth_result, auth_request); }); if (!status) { + LOG(WARNING) << "CheckAuth Rpc Fail.Fe Ip:" << master_addr.hostname + << ", Fe port:" << master_addr.port << ".Status:" << status.to_string() + << ".Request: " << req->debug_string(); + HttpChannel::send_error(req, HttpStatus::SERVICE_UNAVAILABLE); + return -1; } } @@ -98,6 +108,7 @@ int HttpHandlerWithAuth::on_header(HttpRequest* req) { auth_result.status.status_code = TStatusCode::type::OK; auth_result.status.error_msgs.clear(); } else { + HttpChannel::send_reply(req, HttpStatus::FORBIDDEN); return -1; } #endif diff --git a/be/src/olap/base_tablet.cpp b/be/src/olap/base_tablet.cpp index a499a27b07f6e2..82dc122e19f5ef 100644 --- a/be/src/olap/base_tablet.cpp +++ b/be/src/olap/base_tablet.cpp @@ -376,7 +376,7 @@ Status
BaseTablet::calc_delete_bitmap_between_segments( seq_col_length = _tablet_meta->tablet_schema()->column(seq_col_idx).length() + 1; } size_t rowid_length = 0; - if (!_tablet_meta->tablet_schema()->cluster_key_idxes().empty()) { + if (!_tablet_meta->tablet_schema()->cluster_key_uids().empty()) { rowid_length = PrimaryKeyIndexReader::ROW_ID_LENGTH; } @@ -438,7 +438,6 @@ Status BaseTablet::lookup_row_data(const Slice& encoded_key, const RowLocation& StringRef value = string_column->get_data_at(0); values = value.to_string(); if (write_to_cache) { - StringRef value = string_column->get_data_at(0); RowCache::instance()->insert({tablet_id(), encoded_key}, Slice {value.data, value.size}); } return Status::OK(); @@ -461,7 +460,7 @@ Status BaseTablet::lookup_row_key(const Slice& encoded_key, TabletSchema* latest seq_col_length = schema->column(schema->sequence_col_idx()).length() + 1; } size_t rowid_length = 0; - if (with_rowid && !schema->cluster_key_idxes().empty()) { + if (with_rowid && !schema->cluster_key_uids().empty()) { rowid_length = PrimaryKeyIndexReader::ROW_ID_LENGTH; } Slice key_without_seq = @@ -476,12 +475,12 @@ Status BaseTablet::lookup_row_key(const Slice& encoded_key, TabletSchema* latest int num_segments = cast_set(rs->num_segments()); DCHECK_EQ(segments_key_bounds.size(), num_segments); std::vector picked_segments; - for (int i = num_segments - 1; i >= 0; i--) { - if (key_without_seq.compare(segments_key_bounds[i].max_key()) > 0 || - key_without_seq.compare(segments_key_bounds[i].min_key()) < 0) { + for (int j = num_segments - 1; j >= 0; j--) { + if (key_without_seq.compare(segments_key_bounds[j].max_key()) > 0 || + key_without_seq.compare(segments_key_bounds[j].min_key()) < 0) { continue; } - picked_segments.emplace_back(i); + picked_segments.emplace_back(j); } if (picked_segments.empty()) { continue; @@ -654,7 +653,7 @@ Status BaseTablet::calc_segment_delete_bitmap(RowsetSharedPtr rowset, Slice key = Slice(index_column->get_data_at(i).data, 
index_column->get_data_at(i).size); RowLocation loc; // calculate row id - if (!_tablet_meta->tablet_schema()->cluster_key_idxes().empty()) { + if (!_tablet_meta->tablet_schema()->cluster_key_uids().empty()) { size_t seq_col_length = 0; if (_tablet_meta->tablet_schema()->has_sequence_col()) { seq_col_length = @@ -778,11 +777,11 @@ Status BaseTablet::calc_segment_delete_bitmap(RowsetSharedPtr rowset, if (config::enable_merge_on_write_correctness_check) { RowsetIdUnorderedSet rowsetids; - for (const auto& rowset : specified_rowsets) { - rowsetids.emplace(rowset->rowset_id()); + for (const auto& specified_rowset : specified_rowsets) { + rowsetids.emplace(specified_rowset->rowset_id()); VLOG_NOTICE << "[tabletID:" << tablet_id() << "]" << "[add_sentinel_mark_to_delete_bitmap][end_version:" << end_version << "]" - << "add:" << rowset->rowset_id(); + << "add:" << specified_rowset->rowset_id(); } add_sentinel_mark_to_delete_bitmap(delete_bitmap.get(), rowsetids); } @@ -892,11 +891,11 @@ Status BaseTablet::fetch_value_through_row_column(RowsetSharedPtr input_rowset, std::vector default_values; default_values.resize(cids.size()); for (int i = 0; i < cids.size(); ++i) { - const TabletColumn& column = tablet_schema.column(cids[i]); + const TabletColumn& tablet_column = tablet_schema.column(cids[i]); vectorized::DataTypePtr type = - vectorized::DataTypeFactory::instance().create_data_type(column); - col_uid_to_idx[column.unique_id()] = i; - default_values[i] = column.default_value(); + vectorized::DataTypeFactory::instance().create_data_type(tablet_column); + col_uid_to_idx[tablet_column.unique_id()] = i; + default_values[i] = tablet_column.default_value(); serdes[i] = type->get_serde(); } vectorized::JsonbSerializeUtil::jsonb_to_block(serdes, *string_column, col_uid_to_idx, block, @@ -1326,12 +1325,12 @@ Status BaseTablet::check_delete_bitmap_correctness(DeleteBitmapPtr delete_bitmap required_rowsets_arr.PushBack(value, required_rowsets_arr.GetAllocator()); } } else { - 
std::vector rowsets; + std::vector tablet_rowsets; { std::shared_lock meta_rlock(_meta_lock); - rowsets = get_rowset_by_ids(&rowset_ids); + tablet_rowsets = get_rowset_by_ids(&rowset_ids); } - for (const auto& rowset : rowsets) { + for (const auto& rowset : tablet_rowsets) { rapidjson::Value value; std::string version_str = rowset->get_rowset_info_str(); value.SetString(version_str.c_str(), @@ -1439,12 +1438,12 @@ Status BaseTablet::update_delete_bitmap(const BaseTabletSPtr& self, TabletTxnInf txn_info->partial_update_info->max_version_in_flush_phase; DCHECK(max_version_in_flush_phase != -1); std::vector remained_rowsets; - for (const auto& rowset : specified_rowsets) { - if (rowset->end_version() <= max_version_in_flush_phase && - rowset->produced_by_compaction()) { - rowsets_skip_alignment.emplace_back(rowset); + for (const auto& specified_rowset : specified_rowsets) { + if (specified_rowset->end_version() <= max_version_in_flush_phase && + specified_rowset->produced_by_compaction()) { + rowsets_skip_alignment.emplace_back(specified_rowset); } else { - remained_rowsets.emplace_back(rowset); + remained_rowsets.emplace_back(specified_rowset); } } if (!rowsets_skip_alignment.empty()) { @@ -1604,10 +1603,6 @@ Status BaseTablet::check_rowid_conversion( VLOG_DEBUG << "check_rowid_conversion, location_map is empty"; return Status::OK(); } - if (!tablet_schema()->cluster_key_idxes().empty()) { - VLOG_DEBUG << "skip check_rowid_conversion for mow tables with cluster keys"; - return Status::OK(); - } std::vector dst_segments; RETURN_IF_ERROR( @@ -1762,7 +1757,7 @@ std::vector BaseTablet::get_snapshot_rowset(bool include_stale_ void BaseTablet::calc_consecutive_empty_rowsets( std::vector* empty_rowsets, - const std::vector& candidate_rowsets, int limit) { + const std::vector& candidate_rowsets, int64_t limit) { int len = cast_set(candidate_rowsets.size()); for (int i = 0; i < len - 1; ++i) { auto rowset = candidate_rowsets[i]; diff --git a/be/src/olap/base_tablet.h 
b/be/src/olap/base_tablet.h index f961f4c49eedd6..c6de447200f87c 100644 --- a/be/src/olap/base_tablet.h +++ b/be/src/olap/base_tablet.h @@ -276,10 +276,13 @@ class BaseTablet { // Find the first consecutive empty rowsets. output->size() >= limit void calc_consecutive_empty_rowsets(std::vector* empty_rowsets, const std::vector& candidate_rowsets, - int limit); + int64_t limit); // Return the merged schema of all rowsets - virtual TabletSchemaSPtr merged_tablet_schema() const { return _max_version_schema; } + virtual TabletSchemaSPtr merged_tablet_schema() const { + std::shared_lock rlock(_meta_lock); + return _max_version_schema; + } void traverse_rowsets(std::function visitor, bool include_stale = false) { diff --git a/be/src/olap/bitmap_filter_predicate.h b/be/src/olap/bitmap_filter_predicate.h index 716c99927bf2d6..8d89c7a31fb271 100644 --- a/be/src/olap/bitmap_filter_predicate.h +++ b/be/src/olap/bitmap_filter_predicate.h @@ -37,7 +37,7 @@ class BitmapFilterColumnPredicate : public ColumnPredicate { using SpecificFilter = BitmapFilterFunc; BitmapFilterColumnPredicate(uint32_t column_id, - const std::shared_ptr& filter, int) + const std::shared_ptr& filter) : ColumnPredicate(column_id), _filter(filter), _specific_filter(assert_cast(_filter.get())) {} diff --git a/be/src/olap/bloom_filter.hpp b/be/src/olap/bloom_filter.hpp deleted file mode 100644 index 5c7cb5f9e6419f..00000000000000 --- a/be/src/olap/bloom_filter.hpp +++ /dev/null @@ -1,272 +0,0 @@ -// Licensed to the Apache Software Foundation (ASF) under one -// or more contributor license agreements. See the NOTICE file -// distributed with this work for additional information -// regarding copyright ownership. The ASF licenses this file -// to you under the Apache License, Version 2.0 (the -// "License"); you may not use this file except in compliance -// with the License. 
You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, -// software distributed under the License is distributed on an -// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -// KIND, either express or implied. See the License for the -// specific language governing permissions and limitations -// under the License. - -#ifndef DORIS_BE_SRC_OLAP_COLUMN_FILE_BLOOM_FILTER_HPP -#define DORIS_BE_SRC_OLAP_COLUMN_FILE_BLOOM_FILTER_HPP - -#include - -#include -#include - -#include "olap/olap_define.h" -#include "olap/utils.h" -#include "util/hash_util.hpp" - -namespace doris { - -static const uint64_t DEFAULT_SEED = 104729; -static const uint64_t BLOOM_FILTER_NULL_HASHCODE = 2862933555777941757ULL; - -struct BloomFilterIndexHeader { - uint64_t block_count; - BloomFilterIndexHeader() : block_count(0) {} -} __attribute__((packed)); - -// Bare metal bit set implementation. For performance reasons, this implementation does not -// check for index bounds nor expand the bit set if the specified index is greater than the size. 
-class BitSet { -public: - BitSet() : _data(nullptr), _data_len(0) {} - - ~BitSet() { SAFE_DELETE_ARRAY(_data); } - - // Init BitSet with given bit_num, which will align up to uint64_t - bool init(uint32_t bit_num) { - if (bit_num <= 0) { - return false; - } - - _data_len = (bit_num + sizeof(uint64_t) * 8 - 1) / (sizeof(uint64_t) * 8); - _data = new (std::nothrow) uint64_t[_data_len]; - if (_data == nullptr) { - return false; - } - - memset(_data, 0, _data_len * sizeof(uint64_t)); - return true; - } - - // Init BitSet with given buffer - bool init(uint64_t* data, uint32_t data_len) { - _data = data; - _data_len = data_len; - return true; - } - - // Set the bit specified by param, note that uint64_t type contains 2^6 bits - void set(uint32_t index) { _data[index >> 6] |= 1L << (index % 64); } - - // Return true if the bit specified by param is set - bool get(uint32_t index) const { return (_data[index >> 6] & (1L << (index % 64))) != 0; } - - // Merge with another BitSet by byte, return false when the length is not equal - bool merge(const BitSet& set) { - if (_data_len != set.data_len()) { - return false; - } - - for (uint32_t i = 0; i < _data_len; ++i) { - _data[i] |= set.data()[i]; - } - - return true; - } - - // Convert BitSet to string to convenient debug and test - std::string to_string() const { - uint32_t bit_num = _data_len * sizeof(uint64_t) * 8; - std::string str(bit_num, '0'); - for (uint32_t i = 0; i < bit_num; ++i) { - if ((_data[i >> 6] & (1L << i)) != 0) { - str[i] = '1'; - } - } - - return str; - } - - uint64_t* data() const { return _data; } - - uint32_t data_len() const { return _data_len; } - - uint32_t bit_num() const { return _data_len * sizeof(uint64_t) * 8; } - - void clear() { memset(_data, 0, _data_len * sizeof(uint64_t)); } - - void reset() { - _data = NULL; - _data_len = 0; - } - -private: - uint64_t* _data; - uint32_t _data_len; -}; - -class BloomFilter { -public: - BloomFilter() : _bit_num(0), _hash_function_num(0) {} - ~BloomFilter() 
{} - - // Create BloomFilter with given entry num and fpp, which is used for loading data - bool init(int64_t expected_entries, double fpp) { - uint32_t bit_num = _optimal_bit_num(expected_entries, fpp); - if (!_bit_set.init(bit_num)) { - return false; - } - - _bit_num = _bit_set.bit_num(); - _hash_function_num = _optimal_hash_function_num(expected_entries, _bit_num); - return true; - } - - // Create BloomFilter with given entry num and default fpp - bool init(int64_t expected_entries) { - return this->init(expected_entries, BLOOM_FILTER_DEFAULT_FPP); - } - - // Init BloomFilter with given buffer, which is used for query - bool init(uint64_t* data, uint32_t len, uint32_t hash_function_num) { - _bit_num = sizeof(uint64_t) * 8 * len; - _hash_function_num = hash_function_num; - return _bit_set.init(data, len); - } - - // Compute hash value of given buffer and add to BloomFilter - void add_bytes(const char* buf, uint32_t len) { - uint64_t hash = buf == nullptr ? BLOOM_FILTER_NULL_HASHCODE - : HashUtil::hash64(buf, len, DEFAULT_SEED); - add_hash(hash); - } - - // Generate multiple hash value according to following rule: - // new_hash_value = hash_high_part + (i * hash_low_part) - void add_hash(uint64_t hash) { - uint32_t hash1 = (uint32_t)hash; - uint32_t hash2 = (uint32_t)(hash >> 32); - - for (uint32_t i = 0; i < _hash_function_num; ++i) { - uint64_t combine_hash = hash1 + hash2 * i; - uint32_t index = combine_hash % _bit_num; - _bit_set.set(index); - } - } - - // Compute hash value of given buffer and verify whether exist in BloomFilter - bool test_bytes(const char* buf, uint32_t len) const { - uint64_t hash = buf == nullptr ? 
BLOOM_FILTER_NULL_HASHCODE - : HashUtil::hash64(buf, len, DEFAULT_SEED); - return test_hash(hash); - } - - // Verify whether hash value in BloomFilter - bool test_hash(uint64_t hash) const { - uint32_t hash1 = (uint32_t)hash; - uint32_t hash2 = (uint32_t)(hash >> 32); - - for (uint32_t i = 0; i < _hash_function_num; ++i) { - uint64_t combine_hash = hash1 + hash2 * i; - uint32_t index = combine_hash % _bit_num; - if (!_bit_set.get(index)) { - return false; - } - } - - return true; - } - - // Merge with another BloomFilter, return false when the length - // and hash function number is not equal - bool merge(const BloomFilter& that) { - if (_bit_num == that.bit_num() && _hash_function_num == that.hash_function_num()) { - _bit_set.merge(that.bit_set()); - return true; - } - - return false; - } - - void clear() { _bit_set.clear(); } - - void reset() { - _bit_num = 0; - _hash_function_num = 0; - _bit_set.reset(); - } - - uint32_t bit_num() const { return _bit_num; } - - uint32_t hash_function_num() const { return _hash_function_num; } - - const BitSet& bit_set() const { return _bit_set; } - - uint64_t* bit_set_data() const { return _bit_set.data(); } - - uint32_t bit_set_data_len() const { return _bit_set.data_len(); } - - // Convert BloomFilter to string to convenient debug and test - std::string to_string() const { - std::stringstream bf_stream; - bf_stream << "bit_num:" << _bit_num << " hash_function_num:" << _hash_function_num - << " bit_set:" << _bit_set.to_string(); - return bf_stream.str(); - } - - // Get points which set by given buffer in the BitSet - std::string get_bytes_points_string(const char* buf, uint32_t len) const { - uint64_t hash = buf == nullptr ? 
BLOOM_FILTER_NULL_HASHCODE - : HashUtil::hash64(buf, len, DEFAULT_SEED); - uint32_t hash1 = (uint32_t)hash; - uint32_t hash2 = (uint32_t)(hash >> 32); - - std::stringstream stream; - for (uint32_t i = 0; i < _hash_function_num; ++i) { - if (i != 0) { - stream << "-"; - } - - uint32_t combine_hash = hash1 + hash2 * i; - uint32_t index = combine_hash % _bit_num; - stream << index; - } - - return stream.str(); - } - -private: - // Compute the optimal bit number according to the following rule: - // m = -n * ln(fpp) / (ln(2) ^ 2) - uint32_t _optimal_bit_num(int64_t n, double fpp) { - return (uint32_t)(-n * log(fpp) / (log(2) * log(2))); - } - - // Compute the optimal hash function number according to the following rule: - // k = round(m * ln(2) / n) - uint32_t _optimal_hash_function_num(int64_t n, uint32_t m) { - uint32_t k = (uint32_t)round(m * log(2) / n); - return k > 1 ? k : 1; - } - - BitSet _bit_set; - uint32_t _bit_num; - uint32_t _hash_function_num; -}; - -} // namespace doris - -#endif // DORIS_BE_SRC_OLAP_COLUMN_FILE_BLOOM_FILTER_HPP diff --git a/be/src/olap/compaction.cpp b/be/src/olap/compaction.cpp index e71e1862dc8dbb..8c45c20f799427 100644 --- a/be/src/olap/compaction.cpp +++ b/be/src/olap/compaction.cpp @@ -191,11 +191,14 @@ Status Compaction::merge_input_rowsets() { SCOPED_TIMER(_merge_rowsets_latency_timer); // 1. 
Merge segment files and write bkd inverted index if (_is_vertical) { + if (!_tablet->tablet_schema()->cluster_key_uids().empty()) { + RETURN_IF_ERROR(update_delete_bitmap()); + } res = Merger::vertical_merge_rowsets(_tablet, compaction_type(), *_cur_tablet_schema, input_rs_readers, _output_rs_writer.get(), get_avg_segment_rows(), way_num, &_stats); } else { - if (!_tablet->tablet_schema()->cluster_key_idxes().empty()) { + if (!_tablet->tablet_schema()->cluster_key_uids().empty()) { return Status::InternalError( "mow table with cluster keys does not support non vertical compaction"); } @@ -872,6 +875,60 @@ void Compaction::construct_index_compaction_columns(RowsetWriterContext& ctx) { } } +Status CompactionMixin::update_delete_bitmap() { + // for mow with cluster keys, compaction read data with delete bitmap + // if tablet is not ready(such as schema change), we need to update delete bitmap + { + std::shared_lock meta_rlock(_tablet->get_header_lock()); + if (_tablet->tablet_state() != TABLET_NOTREADY) { + return Status::OK(); + } + } + OlapStopWatch watch; + std::vector rowsets; + for (const auto& rowset : _input_rowsets) { + std::lock_guard rwlock(tablet()->get_rowset_update_lock()); + std::shared_lock rlock(_tablet->get_header_lock()); + Status st = _tablet->update_delete_bitmap_without_lock(_tablet, rowset, &rowsets); + if (!st.ok()) { + LOG(INFO) << "failed update_delete_bitmap_without_lock for tablet_id=" + << _tablet->tablet_id() << ", st=" << st.to_string(); + return st; + } + rowsets.push_back(rowset); + } + LOG(INFO) << "finish update delete bitmap for tablet: " << _tablet->tablet_id() + << ", rowsets: " << _input_rowsets.size() << ", cost: " << watch.get_elapse_time_us() + << "(us)"; + return Status::OK(); +} + +Status CloudCompactionMixin::update_delete_bitmap() { + // for mow with cluster keys, compaction read data with delete bitmap + // if tablet is not ready(such as schema change), we need to update delete bitmap + { + std::shared_lock 
meta_rlock(_tablet->get_header_lock()); + if (_tablet->tablet_state() != TABLET_NOTREADY) { + return Status::OK(); + } + } + OlapStopWatch watch; + std::vector rowsets; + for (const auto& rowset : _input_rowsets) { + Status st = _tablet->update_delete_bitmap_without_lock(_tablet, rowset, &rowsets); + if (!st.ok()) { + LOG(INFO) << "failed update_delete_bitmap_without_lock for tablet_id=" + << _tablet->tablet_id() << ", st=" << st.to_string(); + return st; + } + rowsets.push_back(rowset); + } + LOG(INFO) << "finish update delete bitmap for tablet: " << _tablet->tablet_id() + << ", rowsets: " << _input_rowsets.size() << ", cost: " << watch.get_elapse_time_us() + << "(us)"; + return Status::OK(); +} + Status CompactionMixin::construct_output_rowset_writer(RowsetWriterContext& ctx) { // only do index compaction for dup_keys and unique_keys with mow enabled if (config::inverted_index_compaction_enable && @@ -908,7 +965,8 @@ Status CompactionMixin::modify_rowsets() { LOG(INFO) << "RowLocation Set inited succ for tablet:" << _tablet->tablet_id(); } std::unique_ptr> location_map; - if (config::enable_rowid_conversion_correctness_check) { + if (config::enable_rowid_conversion_correctness_check && + tablet()->tablet_schema()->cluster_key_uids().empty()) { location_map = std::make_unique>(); LOG(INFO) << "Location Map inited succ for tablet:" << _tablet->tablet_id(); } @@ -925,7 +983,7 @@ Status CompactionMixin::modify_rowsets() { if (missed_rows) { missed_rows_size = missed_rows->size(); std::size_t merged_missed_rows_size = _stats.merged_rows; - if (!_tablet->tablet_meta()->tablet_schema()->cluster_key_idxes().empty()) { + if (!_tablet->tablet_meta()->tablet_schema()->cluster_key_uids().empty()) { merged_missed_rows_size += _stats.filtered_rows; } if (_tablet->tablet_state() == TABLET_RUNNING && diff --git a/be/src/olap/compaction.h b/be/src/olap/compaction.h index 06ef4268529247..7f92a6c5f4d7dc 100644 --- a/be/src/olap/compaction.h +++ b/be/src/olap/compaction.h @@ -84,6 
+84,8 @@ class Compaction { int64_t merge_way_num(); + virtual Status update_delete_bitmap() = 0; + // the root tracker for this compaction std::shared_ptr _mem_tracker; @@ -146,6 +148,8 @@ class CompactionMixin : public Compaction { virtual Status modify_rowsets(); + Status update_delete_bitmap() override; + StorageEngine& _engine; private: @@ -175,6 +179,8 @@ class CloudCompactionMixin : public Compaction { protected: CloudTablet* cloud_tablet() { return static_cast(_tablet.get()); } + Status update_delete_bitmap() override; + virtual void garbage_collection(); CloudStorageEngine& _engine; diff --git a/be/src/olap/cumulative_compaction.cpp b/be/src/olap/cumulative_compaction.cpp index b961c694ede4d0..2dfd30fb86ed9a 100644 --- a/be/src/olap/cumulative_compaction.cpp +++ b/be/src/olap/cumulative_compaction.cpp @@ -145,7 +145,7 @@ Status CumulativeCompaction::pick_rowsets_to_compact() { DCHECK(missing_versions.size() % 2 == 0); LOG(WARNING) << "There are missed versions among rowsets. " << "total missed version size: " << missing_versions.size() / 2 - << " first missed version prev rowset verison=" << missing_versions[0] + << ", first missed version prev rowset verison=" << missing_versions[0] << ", first missed version next rowset version=" << missing_versions[1] << ", tablet=" << _tablet->tablet_id(); } diff --git a/be/src/olap/delta_writer_v2.h b/be/src/olap/delta_writer_v2.h index beeb3d3ecd3ec5..f9c2800a68f499 100644 --- a/be/src/olap/delta_writer_v2.h +++ b/be/src/olap/delta_writer_v2.h @@ -46,7 +46,6 @@ namespace doris { class FlushToken; class MemTable; -class MemTracker; class Schema; class StorageEngine; class TupleDescriptor; diff --git a/be/src/olap/inverted_index_parser.cpp b/be/src/olap/inverted_index_parser.cpp index f7e511970d91f2..f1de5a5e0c10fc 100644 --- a/be/src/olap/inverted_index_parser.cpp +++ b/be/src/olap/inverted_index_parser.cpp @@ -136,4 +136,13 @@ std::string get_parser_stopwords_from_properties( } } +std::string 
get_parser_dict_compression_from_properties( + const std::map& properties) { + if (properties.find(INVERTED_INDEX_PARSER_DICT_COMPRESSION_KEY) != properties.end()) { + return properties.at(INVERTED_INDEX_PARSER_DICT_COMPRESSION_KEY); + } else { + return ""; + } +} + } // namespace doris diff --git a/be/src/olap/inverted_index_parser.h b/be/src/olap/inverted_index_parser.h index 0b8426d74c7ab3..f1f85995a206a8 100644 --- a/be/src/olap/inverted_index_parser.h +++ b/be/src/olap/inverted_index_parser.h @@ -83,6 +83,8 @@ const std::string INVERTED_INDEX_PARSER_LOWERCASE_KEY = "lower_case"; const std::string INVERTED_INDEX_PARSER_STOPWORDS_KEY = "stopwords"; +const std::string INVERTED_INDEX_PARSER_DICT_COMPRESSION_KEY = "dict_compression"; + std::string inverted_index_parser_type_to_string(InvertedIndexParserType parser_type); InvertedIndexParserType get_inverted_index_parser_type_from_string(const std::string& parser_str); @@ -119,4 +121,7 @@ std::string get_parser_lowercase_from_properties( std::string get_parser_stopwords_from_properties( const std::map& properties); +std::string get_parser_dict_compression_from_properties( + const std::map& properties); + } // namespace doris diff --git a/be/src/olap/memtable.cpp b/be/src/olap/memtable.cpp index 5db3d89378bcc2..765f67a07c7884 100644 --- a/be/src/olap/memtable.cpp +++ b/be/src/olap/memtable.cpp @@ -350,7 +350,7 @@ Status MemTable::_sort_by_cluster_keys() { } Tie tie = Tie(0, mutable_block.rows()); - for (auto cid : _tablet_schema->cluster_key_idxes()) { + for (auto cid : _tablet_schema->cluster_key_uids()) { auto index = _tablet_schema->field_index(cid); if (index == -1) { return Status::InternalError("could not find cluster key column with unique_id=" + @@ -619,7 +619,7 @@ Status MemTable::_to_block(std::unique_ptr* res) { (_skip_bitmap_col_idx == -1) ? 
_aggregate() : _aggregate(); } if (_keys_type == KeysType::UNIQUE_KEYS && _enable_unique_key_mow && - !_tablet_schema->cluster_key_idxes().empty()) { + !_tablet_schema->cluster_key_uids().empty()) { if (_partial_update_mode != UniqueKeyUpdateModePB::UPSERT) { return Status::InternalError( "Partial update for mow with cluster keys is not supported"); diff --git a/be/src/olap/memtable_writer.h b/be/src/olap/memtable_writer.h index fb07e740fa3cf6..713400793a1754 100644 --- a/be/src/olap/memtable_writer.h +++ b/be/src/olap/memtable_writer.h @@ -45,7 +45,6 @@ namespace doris { class FlushToken; class MemTable; -class MemTracker; class StorageEngine; class TupleDescriptor; class SlotDescriptor; diff --git a/be/src/olap/merger.cpp b/be/src/olap/merger.cpp index b207cc4c5ad22b..975aaa0bca3de5 100644 --- a/be/src/olap/merger.cpp +++ b/be/src/olap/merger.cpp @@ -86,7 +86,7 @@ Status Merger::vmerge_rowsets(BaseTabletSPtr tablet, ReaderType reader_type, merge_tablet_schema->merge_dropped_columns(*del_pred_rs->tablet_schema()); } reader_params.tablet_schema = merge_tablet_schema; - if (!tablet->tablet_schema()->cluster_key_idxes().empty()) { + if (!tablet->tablet_schema()->cluster_key_uids().empty()) { reader_params.delete_bitmap = &tablet->tablet_meta()->delete_bitmap(); } @@ -173,8 +173,8 @@ void Merger::vertical_split_columns(const TabletSchema& tablet_schema, if (delete_sign_idx != -1) { key_columns.emplace_back(delete_sign_idx); } - if (!tablet_schema.cluster_key_idxes().empty()) { - for (const auto& cid : tablet_schema.cluster_key_idxes()) { + if (!tablet_schema.cluster_key_uids().empty()) { + for (const auto& cid : tablet_schema.cluster_key_uids()) { auto idx = tablet_schema.field_index(cid); DCHECK(idx >= 0) << "could not find cluster key column with unique_id=" << cid << " in tablet schema, table_id=" << tablet_schema.table_id(); @@ -186,7 +186,7 @@ void Merger::vertical_split_columns(const TabletSchema& tablet_schema, // cluster key unique ids: [3, 1, 4] // the 
key_columns should be [0, 1, 3, 5] // the key_group_cluster_key_idxes should be [2, 1, 3] - for (const auto& cid : tablet_schema.cluster_key_idxes()) { + for (const auto& cid : tablet_schema.cluster_key_uids()) { auto idx = tablet_schema.field_index(cid); for (auto i = 0; i < key_columns.size(); ++i) { if (idx == key_columns[i]) { @@ -261,7 +261,7 @@ Status Merger::vertical_compact_one_group( reader_params.tablet_schema = merge_tablet_schema; bool has_cluster_key = false; - if (!tablet->tablet_schema()->cluster_key_idxes().empty()) { + if (!tablet->tablet_schema()->cluster_key_uids().empty()) { reader_params.delete_bitmap = &tablet->tablet_meta()->delete_bitmap(); has_cluster_key = true; } diff --git a/be/src/olap/metadata_adder.h b/be/src/olap/metadata_adder.h index 559c5db873b2f6..5b5ba16322490e 100644 --- a/be/src/olap/metadata_adder.h +++ b/be/src/olap/metadata_adder.h @@ -20,6 +20,8 @@ #include #include +#include "runtime/exec_env.h" +#include "runtime/memory/mem_tracker_limiter.h" #include "util/runtime_profile.h" namespace doris { @@ -27,8 +29,8 @@ namespace doris { inline bvar::Adder g_rowset_meta_mem_bytes("doris_rowset_meta_mem_bytes"); inline bvar::Adder g_rowset_meta_num("doris_rowset_meta_num"); -inline bvar::Adder g_all_rowsets_mem_bytes("doris_all_rowsets_mem_bytes"); -inline bvar::Adder g_all_rowsets_num("doris_all_rowsets_num"); +inline bvar::Adder g_rowset_mem_bytes("doris_rowset_mem_bytes"); +inline bvar::Adder g_rowset_num("doris_rowset_num"); inline bvar::Adder g_tablet_meta_mem_bytes("doris_tablet_meta_mem_bytes"); inline bvar::Adder g_tablet_meta_num("doris_tablet_meta_num"); @@ -42,8 +44,9 @@ inline bvar::Adder g_tablet_index_num("doris_tablet_index_num"); inline bvar::Adder g_tablet_schema_mem_bytes("doris_tablet_schema_mem_bytes"); inline bvar::Adder g_tablet_schema_num("doris_tablet_schema_num"); -inline bvar::Adder g_all_segments_mem_bytes("doris_all_segments_mem_bytes"); -inline bvar::Adder g_all_segments_num("doris_all_segments_num"); 
+inline bvar::Adder g_segment_mem_bytes("doris_segment_mem_bytes"); +inline bvar::Adder g_segment_num("doris_segment_num"); +inline bvar::Adder g_segment_estimate_mem_bytes("doris_segment_estimate_mem_bytes"); inline bvar::Adder g_column_reader_mem_bytes("doris_column_reader_mem_bytes"); inline bvar::Adder g_column_reader_num("doris_column_reader_num"); @@ -96,6 +99,10 @@ class ZoneMapIndexReader; When a derived Class extends MetadataAdder, then the Class's number and fixed length field's memory can be counted automatically. But if the Class has variable length field, then you should overwrite get_metadata_size and call update_metadata_size when the Class's memory changes. + get_metadata_size is only the memory of the metadata object itself, not include child objects, + for example, TabletMeta::get_metadata_size does not include the memory of TabletSchema. + Note, the memory allocated by Doris Allocator is not included. + There are some special situations that need to be noted: 1. when the derived Class override copy constructor, you'd better update memory size(call update_metadata_size) if derived class's memory changed in its copy constructor or you not call MetadataAdder's copy constructor. 
@@ -111,6 +118,31 @@ class MetadataAdder { static void dump_metadata_object(RuntimeProfile* object_heap_dump_snapshot); + static int64_t get_all_tablets_size() { + return g_tablet_meta_mem_bytes.get_value() + g_tablet_column_mem_bytes.get_value() + + g_tablet_index_mem_bytes.get_value() + g_tablet_schema_mem_bytes.get_value(); + } + + static int64_t get_all_rowsets_size() { + return g_rowset_meta_mem_bytes.get_value() + g_rowset_mem_bytes.get_value(); + } + + static int64_t get_all_segments_size() { + return g_segment_mem_bytes.get_value() + g_column_reader_mem_bytes.get_value() + + g_bitmap_index_reader_mem_bytes.get_value() + + g_bloom_filter_index_reader_mem_bytes.get_value() + + g_index_page_reader_mem_bytes.get_value() + + g_indexed_column_reader_mem_bytes.get_value() + + g_inverted_index_reader_mem_bytes.get_value() + + g_ordinal_index_reader_mem_bytes.get_value() + + g_zone_map_index_reader_mem_bytes.get_value(); + } + + // Doris currently uses the estimated segments memory as the basis, maybe it is more realistic. 
+ static int64_t get_all_segments_estimate_size() { + return g_segment_estimate_mem_bytes.get_value(); + } + protected: MetadataAdder(const MetadataAdder& other); @@ -122,7 +154,6 @@ class MetadataAdder { MetadataAdder& operator=(const MetadataAdder& other) = default; -private: int64_t _current_meta_size {0}; void add_mem_size(int64_t val); @@ -167,7 +198,7 @@ void MetadataAdder::add_mem_size(int64_t val) { if constexpr (std::is_same_v) { g_rowset_meta_mem_bytes << val; } else if constexpr (std::is_same_v) { - g_all_rowsets_mem_bytes << val; + g_rowset_mem_bytes << val; } else if constexpr (std::is_same_v) { g_tablet_meta_mem_bytes << val; } else if constexpr (std::is_same_v) { @@ -177,7 +208,7 @@ void MetadataAdder::add_mem_size(int64_t val) { } else if constexpr (std::is_same_v) { g_tablet_schema_mem_bytes << val; } else if constexpr (std::is_same_v) { - g_all_segments_mem_bytes << val; + g_segment_mem_bytes << val; } else if constexpr (std::is_same_v) { g_column_reader_mem_bytes << val; } else if constexpr (std::is_same_v) { @@ -208,7 +239,7 @@ void MetadataAdder::add_num(int64_t val) { if constexpr (std::is_same_v) { g_rowset_meta_num << val; } else if constexpr (std::is_same_v) { - g_all_rowsets_num << val; + g_rowset_num << val; } else if constexpr (std::is_same_v) { g_tablet_meta_num << val; } else if constexpr (std::is_same_v) { @@ -218,7 +249,7 @@ void MetadataAdder::add_num(int64_t val) { } else if constexpr (std::is_same_v) { g_tablet_schema_num << val; } else if constexpr (std::is_same_v) { - g_all_segments_num << val; + g_segment_num << val; } else if constexpr (std::is_same_v) { g_column_reader_num << val; } else if constexpr (std::is_same_v) { @@ -250,12 +281,12 @@ void MetadataAdder::dump_metadata_object(RuntimeProfile* object_heap_dump_sna COUNTER_SET(rowset_meta_mem_bytes_counter, g_rowset_meta_mem_bytes.get_value()); COUNTER_SET(rowset_meta_num_counter, g_rowset_meta_num.get_value()); - RuntimeProfile::Counter* all_rowsets_mem_bytes_counter = - 
ADD_COUNTER(object_heap_dump_snapshot, "AllRowsetsMemBytes", TUnit::BYTES); - RuntimeProfile::Counter* all_rowsets_num_counter = - ADD_COUNTER(object_heap_dump_snapshot, "AllRowsetsNum", TUnit::UNIT); - COUNTER_SET(all_rowsets_mem_bytes_counter, g_all_rowsets_mem_bytes.get_value()); - COUNTER_SET(all_rowsets_num_counter, g_all_rowsets_num.get_value()); + RuntimeProfile::Counter* rowset_mem_bytes_counter = + ADD_COUNTER(object_heap_dump_snapshot, "RowsetMemBytes", TUnit::BYTES); + RuntimeProfile::Counter* rowset_num_counter = + ADD_COUNTER(object_heap_dump_snapshot, "RowsetNum", TUnit::UNIT); + COUNTER_SET(rowset_mem_bytes_counter, g_rowset_mem_bytes.get_value()); + COUNTER_SET(rowset_num_counter, g_rowset_num.get_value()); RuntimeProfile::Counter* tablet_meta_mem_bytes_counter = ADD_COUNTER(object_heap_dump_snapshot, "TabletMetaMemBytes", TUnit::BYTES); @@ -285,12 +316,12 @@ void MetadataAdder::dump_metadata_object(RuntimeProfile* object_heap_dump_sna COUNTER_SET(tablet_schema_mem_bytes_counter, g_tablet_schema_mem_bytes.get_value()); COUNTER_SET(tablet_schema_num_counter, g_tablet_schema_num.get_value()); - RuntimeProfile::Counter* all_segments_mem_bytes_counter = - ADD_COUNTER(object_heap_dump_snapshot, "AllSegmentsMemBytes", TUnit::BYTES); - RuntimeProfile::Counter* all_segments_num_counter = - ADD_COUNTER(object_heap_dump_snapshot, "AllSegmentsNum", TUnit::UNIT); - COUNTER_SET(all_segments_mem_bytes_counter, g_all_segments_mem_bytes.get_value()); - COUNTER_SET(all_segments_num_counter, g_all_segments_num.get_value()); + RuntimeProfile::Counter* segment_mem_bytes_counter = + ADD_COUNTER(object_heap_dump_snapshot, "SegmentMemBytes", TUnit::BYTES); + RuntimeProfile::Counter* segment_num_counter = + ADD_COUNTER(object_heap_dump_snapshot, "SegmentNum", TUnit::UNIT); + COUNTER_SET(segment_mem_bytes_counter, g_segment_mem_bytes.get_value()); + COUNTER_SET(segment_num_counter, g_segment_num.get_value()); RuntimeProfile::Counter* column_reader_mem_bytes_counter = 
ADD_COUNTER(object_heap_dump_snapshot, "ColumnReaderMemBytes", TUnit::BYTES); diff --git a/be/src/olap/olap_server.cpp b/be/src/olap/olap_server.cpp index 736bdaa99304d3..90d0883984e78b 100644 --- a/be/src/olap/olap_server.cpp +++ b/be/src/olap/olap_server.cpp @@ -1071,7 +1071,8 @@ Status StorageEngine::_submit_compaction_task(TabletSharedPtr tablet, if (!tablet->can_do_compaction(tablet->data_dir()->path_hash(), compaction_type)) { LOG(INFO) << "Tablet state has been changed, no need to begin this compaction " "task, tablet_id=" - << tablet->tablet_id() << "tablet_state=" << tablet->tablet_state(); + << tablet->tablet_id() << ", tablet_state=" << tablet->tablet_state(); + _pop_tablet_from_submitted_compaction(tablet, compaction_type); return; } tablet->compaction_stage = CompactionStage::EXECUTING; diff --git a/be/src/olap/rowset/beta_rowset.cpp b/be/src/olap/rowset/beta_rowset.cpp index bbb2ca72b4ae7f..cd52deed0c8a4d 100644 --- a/be/src/olap/rowset/beta_rowset.cpp +++ b/be/src/olap/rowset/beta_rowset.cpp @@ -703,10 +703,24 @@ Status BetaRowset::show_nested_index_file(rapidjson::Value* rowset_value, rapidjson::Document::AllocatorType& allocator) { const auto& fs = _rowset_meta->fs(); auto storage_format = _schema->get_inverted_index_storage_format(); - auto format_str = storage_format == InvertedIndexStorageFormatPB::V1 ? 
"V1" : "V2"; + std::string format_str; + switch (storage_format) { + case InvertedIndexStorageFormatPB::V1: + format_str = "V1"; + break; + case InvertedIndexStorageFormatPB::V2: + format_str = "V2"; + break; + case InvertedIndexStorageFormatPB::V3: + format_str = "V3"; + break; + default: + return Status::InternalError("inverted index storage format error"); + break; + } auto rs_id = rowset_id().to_string(); rowset_value->AddMember("rowset_id", rapidjson::Value(rs_id.c_str(), allocator), allocator); - rowset_value->AddMember("index_storage_format", rapidjson::Value(format_str, allocator), + rowset_value->AddMember("index_storage_format", rapidjson::Value(format_str.c_str(), allocator), allocator); rapidjson::Value segments(rapidjson::kArrayType); for (int seg_id = 0; seg_id < num_segments(); ++seg_id) { diff --git a/be/src/olap/rowset/beta_rowset_writer.cpp b/be/src/olap/rowset/beta_rowset_writer.cpp index 198b4e8595ed20..ab5bc48db80b00 100644 --- a/be/src/olap/rowset/beta_rowset_writer.cpp +++ b/be/src/olap/rowset/beta_rowset_writer.cpp @@ -60,6 +60,7 @@ #include "vec/data_types/data_type_factory.hpp" namespace doris { +#include "common/compile_check_begin.h" using namespace ErrorCode; namespace { @@ -475,15 +476,15 @@ Status BetaRowsetWriter::_rename_compacted_segments(int64_t begin, int64_t end) return Status::OK(); } -void BetaRowsetWriter::_clear_statistics_for_deleting_segments_unsafe(uint64_t begin, - uint64_t end) { +void BetaRowsetWriter::_clear_statistics_for_deleting_segments_unsafe(uint32_t begin, + uint32_t end) { VLOG_DEBUG << "_segid_statistics_map clear record segid range from:" << begin << " to:" << end; - for (int i = begin; i <= end; ++i) { + for (uint32_t i = begin; i <= end; ++i) { _segid_statistics_map.erase(i); } } -Status BetaRowsetWriter::_rename_compacted_segment_plain(uint64_t seg_id) { +Status BetaRowsetWriter::_rename_compacted_segment_plain(uint32_t seg_id) { if (seg_id == _num_segcompacted) { ++_num_segcompacted; return Status::OK(); 
@@ -581,7 +582,7 @@ Status BetaRowsetWriter::_segcompaction_if_necessary() { Status status = Status::OK(); // if not doing segcompaction, just check segment number if (!config::enable_segcompaction || !_context.enable_segcompaction || - !_context.tablet_schema->cluster_key_idxes().empty() || + !_context.tablet_schema->cluster_key_uids().empty() || _context.tablet_schema->num_variant_columns() > 0) { return _check_segment_number_limit(_num_segment); } @@ -653,7 +654,7 @@ Status BaseBetaRowsetWriter::add_rowset(RowsetSharedPtr rowset) { _num_rows_written += rowset->num_rows(); _total_data_size += rowset->rowset_meta()->data_disk_size(); _total_index_size += rowset->rowset_meta()->index_disk_size(); - _num_segment += rowset->num_segments(); + _num_segment += cast_set(rowset->num_segments()); // append key_bounds to current rowset RETURN_IF_ERROR(rowset->get_segments_key_bounds(&_segments_encoded_key_bounds)); @@ -1043,7 +1044,7 @@ Status BaseBetaRowsetWriter::add_segment(uint32_t segment_id, const SegmentStati if (segment_id >= _segment_num_rows.size()) { _segment_num_rows.resize(segment_id + 1); } - _segment_num_rows[segid_offset] = segstat.row_num; + _segment_num_rows[segid_offset] = cast_set(segstat.row_num); } VLOG_DEBUG << "_segid_statistics_map add new record. 
segment_id:" << segment_id << " row_num:" << segstat.row_num << " data_size:" << segstat.data_size @@ -1111,4 +1112,5 @@ Status BetaRowsetWriter::flush_segment_writer_for_segcompaction( return Status::OK(); } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/olap/rowset/beta_rowset_writer.h b/be/src/olap/rowset/beta_rowset_writer.h index d96301af22630d..a69d1063a55086 100644 --- a/be/src/olap/rowset/beta_rowset_writer.h +++ b/be/src/olap/rowset/beta_rowset_writer.h @@ -298,9 +298,9 @@ class BetaRowsetWriter : public BaseBetaRowsetWriter { Status _load_noncompacted_segment(segment_v2::SegmentSharedPtr& segment, int32_t segment_id); Status _find_longest_consecutive_small_segment(SegCompactionCandidatesSharedPtr& segments); Status _rename_compacted_segments(int64_t begin, int64_t end); - Status _rename_compacted_segment_plain(uint64_t seg_id); + Status _rename_compacted_segment_plain(uint32_t seg_id); Status _rename_compacted_indices(int64_t begin, int64_t end, uint64_t seg_id); - void _clear_statistics_for_deleting_segments_unsafe(uint64_t begin, uint64_t end); + void _clear_statistics_for_deleting_segments_unsafe(uint32_t begin, uint32_t end); StorageEngine& _engine; diff --git a/be/src/olap/rowset/segment_creator.cpp b/be/src/olap/rowset/segment_creator.cpp index c2a4469d97f324..e0eb7534123a86 100644 --- a/be/src/olap/rowset/segment_creator.cpp +++ b/be/src/olap/rowset/segment_creator.cpp @@ -115,8 +115,7 @@ Status SegmentFlusher::close() { bool SegmentFlusher::need_buffering() { // buffering variants for schema change return _context.write_type == DataWriteType::TYPE_SCHEMA_CHANGE && - (_context.tablet_schema->num_variant_columns() > 0 || - !_context.tablet_schema->cluster_key_idxes().empty()); + _context.tablet_schema->num_variant_columns() > 0; } Status SegmentFlusher::_add_rows(std::unique_ptr& segment_writer, diff --git a/be/src/olap/rowset/segment_v2/block_split_bloom_filter.h 
b/be/src/olap/rowset/segment_v2/block_split_bloom_filter.h index f68ddd7e74bfc5..8dc470d9da4f88 100644 --- a/be/src/olap/rowset/segment_v2/block_split_bloom_filter.h +++ b/be/src/olap/rowset/segment_v2/block_split_bloom_filter.h @@ -34,7 +34,6 @@ class BlockSplitBloomFilter : public BloomFilter { void add_hash(uint64_t hash) override; bool test_hash(uint64_t hash) const override; - bool contains(const BloomFilter&) const override { return true; } private: // Bytes in a tiny Bloom filter block. diff --git a/be/src/olap/rowset/segment_v2/bloom_filter.h b/be/src/olap/rowset/segment_v2/bloom_filter.h index a7845d1ca36704..4f4adf0fd12283 100644 --- a/be/src/olap/rowset/segment_v2/bloom_filter.h +++ b/be/src/olap/rowset/segment_v2/bloom_filter.h @@ -186,7 +186,7 @@ class BloomFilter { /// Checks if this contains everything from another bloom filter. /// Bloom filters must have equal size and seed. - virtual bool contains(const BloomFilter& bf_) const = 0; + virtual bool contains(const BloomFilter& bf_) const { return true; }; virtual char* data() const { return _data; } diff --git a/be/src/olap/rowset/segment_v2/bloom_filter_index_reader.cpp b/be/src/olap/rowset/segment_v2/bloom_filter_index_reader.cpp index 609d21ce4f5c22..8c63c25d20acee 100644 --- a/be/src/olap/rowset/segment_v2/bloom_filter_index_reader.cpp +++ b/be/src/olap/rowset/segment_v2/bloom_filter_index_reader.cpp @@ -70,6 +70,7 @@ Status BloomFilterIndexIterator::read_bloom_filter(rowid_t ordinal, auto column = data_type->create_column(); RETURN_IF_ERROR(_bloom_filter_iter.seek_to_ordinal(ordinal)); + DCHECK(current_bloom_filter_index() == ordinal); size_t num_read = num_to_read; RETURN_IF_ERROR(_bloom_filter_iter.next_batch(&num_read, column)); DCHECK(num_to_read == num_read); diff --git a/be/src/olap/rowset/segment_v2/bloom_filter_index_writer.cpp b/be/src/olap/rowset/segment_v2/bloom_filter_index_writer.cpp index edc6102703f492..3f9fb94df0a844 100644 --- 
a/be/src/olap/rowset/segment_v2/bloom_filter_index_writer.cpp +++ b/be/src/olap/rowset/segment_v2/bloom_filter_index_writer.cpp @@ -21,6 +21,7 @@ #include #include +#include #include #include #include @@ -68,15 +69,12 @@ class BloomFilterIndexWriterImpl : public BloomFilterIndexWriter { explicit BloomFilterIndexWriterImpl(const BloomFilterOptions& bf_options, const TypeInfo* type_info) - : _bf_options(bf_options), - _type_info(type_info), - _has_null(false), - _bf_buffer_size(0) {} + : _bf_options(bf_options), _type_info(type_info) {} ~BloomFilterIndexWriterImpl() override = default; Status add_values(const void* values, size_t count) override { - const CppType* v = (const CppType*)values; + const auto* v = (const CppType*)values; for (int i = 0; i < count; ++i) { if (_values.find(*v) == _values.end()) { if constexpr (_is_slice_type()) { @@ -105,7 +103,7 @@ class BloomFilterIndexWriterImpl : public BloomFilterIndexWriter { bf->set_has_null(_has_null); for (auto& v : _values) { if constexpr (_is_slice_type()) { - Slice* s = (Slice*)&v; + auto* s = (Slice*)&v; bf->add_bytes(s->data, s->size); } else { bf->add_bytes((char*)&v, sizeof(CppType)); @@ -160,11 +158,11 @@ class BloomFilterIndexWriterImpl : public BloomFilterIndexWriter { static constexpr bool _is_int128() { return field_type == FieldType::OLAP_FIELD_TYPE_LARGEINT; } private: - BloomFilterOptions _bf_options; - const TypeInfo* _type_info; + BloomFilterOptions _bf_options {}; + const TypeInfo* _type_info = nullptr; vectorized::Arena _arena; - bool _has_null; - uint64_t _bf_buffer_size; + bool _has_null = false; + uint64_t _bf_buffer_size = 0; // distinct values ValueDict _values; std::vector> _bfs; @@ -173,7 +171,7 @@ class BloomFilterIndexWriterImpl : public BloomFilterIndexWriter { } // namespace Status PrimaryKeyBloomFilterIndexWriterImpl::add_values(const void* values, size_t count) { - const Slice* v = (const Slice*)values; + const auto* v = (const Slice*)values; for (int i = 0; i < count; ++i) { Slice 
new_value; RETURN_IF_CATCH_EXCEPTION(_type_info->deep_copy(&new_value, v, &_arena)); @@ -189,7 +187,7 @@ Status PrimaryKeyBloomFilterIndexWriterImpl::flush() { RETURN_IF_ERROR(bf->init(_values.size(), _bf_options.fpp, _bf_options.strategy)); bf->set_has_null(_has_null); for (auto& v : _values) { - Slice* s = (Slice*)&v; + auto* s = (Slice*)&v; bf->add_bytes(s->data, s->size); } _bf_buffer_size += bf->size(); @@ -205,7 +203,7 @@ Status PrimaryKeyBloomFilterIndexWriterImpl::flush() { Status PrimaryKeyBloomFilterIndexWriterImpl::finish(io::FileWriter* file_writer, ColumnIndexMetaPB* index_meta) { - if (_values.size() > 0) { + if (!_values.empty()) { RETURN_IF_ERROR(flush()); } index_meta->set_type(BLOOM_FILTER_INDEX); @@ -246,7 +244,7 @@ NGramBloomFilterIndexWriterImpl::NGramBloomFilterIndexWriterImpl( } Status NGramBloomFilterIndexWriterImpl::add_values(const void* values, size_t count) { - const Slice* src = reinterpret_cast(values); + const auto* src = reinterpret_cast(values); for (int i = 0; i < count; ++i, ++src) { if (src->size < _gram_size) { continue; @@ -339,7 +337,8 @@ Status NGramBloomFilterIndexWriterImpl::create(const BloomFilterOptions& bf_opti case FieldType::OLAP_FIELD_TYPE_CHAR: case FieldType::OLAP_FIELD_TYPE_VARCHAR: case FieldType::OLAP_FIELD_TYPE_STRING: - res->reset(new NGramBloomFilterIndexWriterImpl(bf_options, gram_size, gram_bf_size)); + *res = std::make_unique(bf_options, gram_size, + gram_bf_size); break; default: return Status::NotSupported("unsupported type for ngram bloom filter index:{}", diff --git a/be/src/olap/rowset/segment_v2/indexed_column_reader.cpp b/be/src/olap/rowset/segment_v2/indexed_column_reader.cpp index 3028211f266157..da6beff5d8d6a2 100644 --- a/be/src/olap/rowset/segment_v2/indexed_column_reader.cpp +++ b/be/src/olap/rowset/segment_v2/indexed_column_reader.cpp @@ -81,7 +81,8 @@ Status IndexedColumnReader::load(bool use_page_cache, bool kept_in_memory, _sole_data_page = 
PagePointer(_meta.ordinal_index_meta().root_page()); } else { RETURN_IF_ERROR(load_index_page(_meta.ordinal_index_meta().root_page(), - &_ordinal_index_page_handle, &_ordinal_index_reader)); + &_ordinal_index_page_handle, + _ordinal_index_reader.get())); _has_index_page = true; } } @@ -92,7 +93,7 @@ Status IndexedColumnReader::load(bool use_page_cache, bool kept_in_memory, _sole_data_page = PagePointer(_meta.value_index_meta().root_page()); } else { RETURN_IF_ERROR(load_index_page(_meta.value_index_meta().root_page(), - &_value_index_page_handle, &_value_index_reader)); + &_value_index_page_handle, _value_index_reader.get())); _has_index_page = true; } } diff --git a/be/src/olap/rowset/segment_v2/indexed_column_reader.h b/be/src/olap/rowset/segment_v2/indexed_column_reader.h index c3469f9f6bed0d..c9640c0007c153 100644 --- a/be/src/olap/rowset/segment_v2/indexed_column_reader.h +++ b/be/src/olap/rowset/segment_v2/indexed_column_reader.h @@ -50,9 +50,12 @@ class EncodingInfo; class IndexedColumnReader : public MetadataAdder { public: explicit IndexedColumnReader(io::FileReaderSPtr file_reader, const IndexedColumnMetaPB& meta) - : _file_reader(std::move(file_reader)), _meta(meta) {} + : _file_reader(std::move(file_reader)), _meta(meta) { + _ordinal_index_reader = std::make_unique(); + _value_index_reader = std::make_unique(); + } - ~IndexedColumnReader(); + ~IndexedColumnReader() override; Status load(bool use_page_cache, bool kept_in_memory, OlapReaderStatistics* index_load_stats = nullptr); @@ -90,8 +93,8 @@ class IndexedColumnReader : public MetadataAdder { bool _has_index_page = false; // valid only when the column contains only one data page PagePointer _sole_data_page; - IndexPageReader _ordinal_index_reader; - IndexPageReader _value_index_reader; + std::unique_ptr _ordinal_index_reader; + std::unique_ptr _value_index_reader; PageHandle _ordinal_index_page_handle; PageHandle _value_index_page_handle; @@ -108,8 +111,8 @@ class IndexedColumnIterator { explicit 
IndexedColumnIterator(const IndexedColumnReader* reader, OlapReaderStatistics* stats = nullptr) : _reader(reader), - _ordinal_iter(&reader->_ordinal_index_reader), - _value_iter(&reader->_value_index_reader), + _ordinal_iter(reader->_ordinal_index_reader.get()), + _value_iter(reader->_value_index_reader.get()), _stats(stats) {} // Seek to the given ordinal entry. Entry 0 is the first entry. diff --git a/be/src/olap/rowset/segment_v2/inverted_index/char_filter/char_replace_char_filter.h b/be/src/olap/rowset/segment_v2/inverted_index/char_filter/char_replace_char_filter.h index d9e5080d2d584d..1e5e6f5d5cedd0 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index/char_filter/char_replace_char_filter.h +++ b/be/src/olap/rowset/segment_v2/inverted_index/char_filter/char_replace_char_filter.h @@ -17,7 +17,7 @@ #pragma once -#include +#include // IWYU pragma: keep #include #include diff --git a/be/src/olap/rowset/segment_v2/inverted_index_file_reader.cpp b/be/src/olap/rowset/segment_v2/inverted_index_file_reader.cpp index 113833d560fd06..8d480829a0cd37 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index_file_reader.cpp +++ b/be/src/olap/rowset/segment_v2/inverted_index_file_reader.cpp @@ -30,8 +30,8 @@ namespace doris::segment_v2 { Status InvertedIndexFileReader::init(int32_t read_buffer_size) { if (!_inited) { _read_buffer_size = read_buffer_size; - if (_storage_format == InvertedIndexStorageFormatPB::V2) { - auto st = _init_from_v2(read_buffer_size); + if (_storage_format >= InvertedIndexStorageFormatPB::V2) { + auto st = _init_from(read_buffer_size); if (!st.ok()) { return st; } @@ -41,7 +41,7 @@ Status InvertedIndexFileReader::init(int32_t read_buffer_size) { return Status::OK(); } -Status InvertedIndexFileReader::_init_from_v2(int32_t read_buffer_size) { +Status InvertedIndexFileReader::_init_from(int32_t read_buffer_size) { auto index_file_full_path = InvertedIndexDescriptor::get_index_file_path_v2(_index_path_prefix); std::unique_lock lock(_mutex); // Lock 
for writing @@ -79,7 +79,7 @@ Status InvertedIndexFileReader::_init_from_v2(int32_t read_buffer_size) { // 3. read file int32_t version = _stream->readInt(); // Read version number - if (version == InvertedIndexStorageFormatPB::V2) { + if (version >= InvertedIndexStorageFormatPB::V2) { DCHECK(version == _storage_format); int32_t numIndices = _stream->readInt(); // Read number of indices ReaderFileEntry* entry = nullptr; diff --git a/be/src/olap/rowset/segment_v2/inverted_index_file_reader.h b/be/src/olap/rowset/segment_v2/inverted_index_file_reader.h index 3b7161c7643cef..443d40cfaf0d4f 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index_file_reader.h +++ b/be/src/olap/rowset/segment_v2/inverted_index_file_reader.h @@ -70,7 +70,7 @@ class InvertedIndexFileReader { int64_t get_inverted_file_size() const { return _stream == nullptr ? 0 : _stream->length(); } private: - Status _init_from_v2(int32_t read_buffer_size); + Status _init_from(int32_t read_buffer_size); Result> _open(int64_t index_id, const std::string& index_suffix) const; diff --git a/be/src/olap/rowset/segment_v2/inverted_index_file_writer.cpp b/be/src/olap/rowset/segment_v2/inverted_index_file_writer.cpp index bb373be5ee906a..4d6892aa78568f 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index_file_writer.cpp +++ b/be/src/olap/rowset/segment_v2/inverted_index_file_writer.cpp @@ -150,7 +150,7 @@ Status InvertedIndexFileWriter::close() { } } else { try { - RETURN_IF_ERROR(write_v2()); + RETURN_IF_ERROR(write()); for (const auto& entry : _indices_dirs) { const auto& dir = entry.second; // delete index path, which contains separated inverted index files @@ -293,7 +293,7 @@ Status InvertedIndexFileWriter::write_v1() { return Status::OK(); } -Status InvertedIndexFileWriter::write_v2() { +Status InvertedIndexFileWriter::write() { std::unique_ptr out_dir = nullptr; std::unique_ptr compound_file_output = nullptr; ErrorContext error_context; @@ -301,10 +301,10 @@ Status 
InvertedIndexFileWriter::write_v2() { // Calculate header length and initialize offset int64_t current_offset = headerLength(); // Prepare file metadata - auto file_metadata = prepare_file_metadata_v2(current_offset); + auto file_metadata = prepare_file_metadata(current_offset); // Create output stream - auto result = create_output_stream_v2(); + auto result = create_output_stream(); out_dir = std::move(result.first); compound_file_output = std::move(result.second); @@ -315,7 +315,7 @@ Status InvertedIndexFileWriter::write_v2() { write_index_headers_and_metadata(compound_file_output.get(), file_metadata); // Copy file data - copy_files_data_v2(compound_file_output.get(), file_metadata); + copy_files_data(compound_file_output.get(), file_metadata); _total_file_size = compound_file_output->getFilePointer(); _file_info.set_index_size(_total_file_size); @@ -470,7 +470,7 @@ void InvertedIndexFileWriter::write_header_and_data_v1(lucene::store::IndexOutpu std::pair, std::unique_ptr> -InvertedIndexFileWriter::create_output_stream_v2() { +InvertedIndexFileWriter::create_output_stream() { io::Path index_path {InvertedIndexDescriptor::get_index_file_path_v2(_index_path_prefix)}; auto* out_dir = DorisFSDirectoryFactory::getDirectory(_fs, index_path.parent_path().c_str()); @@ -486,15 +486,15 @@ InvertedIndexFileWriter::create_output_stream_v2() { void InvertedIndexFileWriter::write_version_and_indices_count(lucene::store::IndexOutput* output) { // Write the version number - output->writeInt(InvertedIndexStorageFormatPB::V2); + output->writeInt(_storage_format); // Write the number of indices const auto num_indices = static_cast(_indices_dirs.size()); output->writeInt(num_indices); } -std::vector -InvertedIndexFileWriter::prepare_file_metadata_v2(int64_t& current_offset) { +std::vector InvertedIndexFileWriter::prepare_file_metadata( + int64_t& current_offset) { std::vector file_metadata; for (const auto& entry : _indices_dirs) { @@ -546,8 +546,8 @@ void 
InvertedIndexFileWriter::write_index_headers_and_metadata( } } -void InvertedIndexFileWriter::copy_files_data_v2(lucene::store::IndexOutput* output, - const std::vector& file_metadata) { +void InvertedIndexFileWriter::copy_files_data(lucene::store::IndexOutput* output, + const std::vector& file_metadata) { const int64_t buffer_length = 16384; uint8_t buffer[buffer_length]; diff --git a/be/src/olap/rowset/segment_v2/inverted_index_file_writer.h b/be/src/olap/rowset/segment_v2/inverted_index_file_writer.h index ba42ffdceb1475..ab7cdbff152460 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index_file_writer.h +++ b/be/src/olap/rowset/segment_v2/inverted_index_file_writer.h @@ -71,7 +71,7 @@ class InvertedIndexFileWriter { Status delete_index(const TabletIndex* index_meta); Status initialize(InvertedIndexDirectoryMap& indices_dirs); virtual ~InvertedIndexFileWriter() = default; - Status write_v2(); + Status write(); Status write_v1(); Status close(); const InvertedIndexFileInfo* get_index_file_info() const { @@ -122,7 +122,7 @@ class InvertedIndexFileWriter { // Helper functions specific to write_v2 virtual std::pair, std::unique_ptr> - create_output_stream_v2(); + create_output_stream(); void write_version_and_indices_count(lucene::store::IndexOutput* output); struct FileMetadata { int64_t index_id; @@ -141,11 +141,11 @@ class InvertedIndexFileWriter { length(len), directory(dir) {} }; - std::vector prepare_file_metadata_v2(int64_t& current_offset); + std::vector prepare_file_metadata(int64_t& current_offset); virtual void write_index_headers_and_metadata(lucene::store::IndexOutput* output, const std::vector& file_metadata); - void copy_files_data_v2(lucene::store::IndexOutput* output, - const std::vector& file_metadata); + void copy_files_data(lucene::store::IndexOutput* output, + const std::vector& file_metadata); Status _insert_directory_into_map(int64_t index_id, const std::string& index_suffix, std::shared_ptr dir); // Member variables... 
diff --git a/be/src/olap/rowset/segment_v2/inverted_index_writer.cpp b/be/src/olap/rowset/segment_v2/inverted_index_writer.cpp index 86a8f89e4c94e4..02edf2f1976e3e 100644 --- a/be/src/olap/rowset/segment_v2/inverted_index_writer.cpp +++ b/be/src/olap/rowset/segment_v2/inverted_index_writer.cpp @@ -212,6 +212,28 @@ class InvertedIndexColumnWriterImpl : public InvertedIndexColumnWriter { (*field)->setOmitTermFreqAndPositions( !(get_parser_phrase_support_string_from_properties(_index_meta->properties()) == INVERTED_INDEX_PARSER_PHRASE_SUPPORT_YES)); + DBUG_EXECUTE_IF("InvertedIndexColumnWriterImpl::create_field_v3", { + if (_index_file_writer->get_storage_format() != InvertedIndexStorageFormatPB::V3) { + return Status::Error( + "debug point: InvertedIndexColumnWriterImpl::create_field_v3 error"); + } + }) + if (_index_file_writer->get_storage_format() >= InvertedIndexStorageFormatPB::V3) { + (*field)->setIndexVersion(IndexVersion::kV3); + // Only effective in v3 + std::string dict_compression = + get_parser_dict_compression_from_properties(_index_meta->properties()); + DBUG_EXECUTE_IF("InvertedIndexColumnWriterImpl::create_field_dic_compression", { + if (dict_compression != INVERTED_INDEX_PARSER_TRUE) { + return Status::Error( + "debug point: " + "InvertedIndexColumnWriterImpl::create_field_dic_compression error"); + } + }) + if (dict_compression == INVERTED_INDEX_PARSER_TRUE) { + (*field)->updateFlag(FlagBits::DICT_COMPRESS); + } + } return Status::OK(); } diff --git a/be/src/olap/rowset/segment_v2/page_handle.h b/be/src/olap/rowset/segment_v2/page_handle.h index b1e53ee808697e..d4dfdfb2ff3c55 100644 --- a/be/src/olap/rowset/segment_v2/page_handle.h +++ b/be/src/olap/rowset/segment_v2/page_handle.h @@ -23,6 +23,10 @@ #include "util/slice.h" // for Slice namespace doris { + +// After disable page cache, sometimes we need to know the percentage of data pages in query memory. 
+inline bvar::Adder g_page_no_cache_mem_bytes("doris_page_no_cache_mem_bytes"); + namespace segment_v2 { // When a column page is read into memory, we use this to store it. @@ -37,8 +41,7 @@ class PageHandle { // This class will take the ownership of input data's memory. It will // free it when deconstructs. PageHandle(DataPage* data) : _is_data_owner(true), _data(data) { - _page_tracker = ExecEnv::GetInstance()->page_no_cache_mem_tracker(); - _page_tracker->consume(_data->capacity()); + g_page_no_cache_mem_bytes << _data->capacity(); } // This class will take the content of cache data, and will make input @@ -51,20 +54,18 @@ class PageHandle { // we can use std::exchange if we switch c++14 on std::swap(_is_data_owner, other._is_data_owner); std::swap(_data, other._data); - _page_tracker = ExecEnv::GetInstance()->page_no_cache_mem_tracker(); } PageHandle& operator=(PageHandle&& other) noexcept { std::swap(_is_data_owner, other._is_data_owner); std::swap(_data, other._data); _cache_data = std::move(other._cache_data); - _page_tracker = ExecEnv::GetInstance()->page_no_cache_mem_tracker(); return *this; } ~PageHandle() { if (_is_data_owner) { - _page_tracker->release(_data->capacity()); + g_page_no_cache_mem_bytes << -_data->capacity(); delete _data; } else { DCHECK(_data == nullptr); @@ -85,7 +86,6 @@ class PageHandle { // otherwise _cache_data is valid, and data is belong to cache. 
bool _is_data_owner = false; DataPage* _data = nullptr; - std::shared_ptr _page_tracker; PageCacheHandle _cache_data; // Don't allow copy and assign diff --git a/be/src/olap/rowset/segment_v2/segment.cpp b/be/src/olap/rowset/segment_v2/segment.cpp index 0ad799683fc458..513c0be4f8cd14 100644 --- a/be/src/olap/rowset/segment_v2/segment.cpp +++ b/be/src/olap/rowset/segment_v2/segment.cpp @@ -163,7 +163,11 @@ Segment::Segment(uint32_t segment_id, RowsetId rowset_id, TabletSchemaSPtr table _tablet_schema(std::move(tablet_schema)), _idx_file_info(idx_file_info) {} -Segment::~Segment() = default; +Segment::~Segment() { + g_segment_estimate_mem_bytes << -_tracked_meta_mem_usage; + // if failed, fix `_tracked_meta_mem_usage` accuracy + DCHECK(_tracked_meta_mem_usage == meta_mem_usage()); +} io::UInt128Wrapper Segment::file_cache_key(std::string_view rowset_id, uint32_t seg_id) { return io::BlockFileCache::hash(fmt::format("{}_{}.dat", rowset_id, seg_id)); @@ -174,6 +178,12 @@ int64_t Segment::get_metadata_size() const { (_pk_index_meta ? 
_pk_index_meta->ByteSizeLong() : 0); } +void Segment::update_metadata_size() { + MetadataAdder::update_metadata_size(); + g_segment_estimate_mem_bytes << _meta_mem_usage - _tracked_meta_mem_usage; + _tracked_meta_mem_usage = _meta_mem_usage; +} + Status Segment::_open() { _footer_pb = std::make_unique(); RETURN_IF_ERROR(_parse_footer(_footer_pb.get())); @@ -191,8 +201,6 @@ Status Segment::_open() { _meta_mem_usage += _pk_index_meta->ByteSizeLong(); } - update_metadata_size(); - _meta_mem_usage += sizeof(*this); _meta_mem_usage += _tablet_schema->num_columns() * config::estimated_mem_per_column_reader; @@ -201,6 +209,8 @@ Status Segment::_open() { // 0.01 comes from PrimaryKeyIndexBuilder::init _meta_mem_usage += BloomFilter::optimal_bit_num(_num_rows, 0.01) / 8; + update_metadata_size(); + return Status::OK(); } @@ -467,6 +477,7 @@ Status Segment::_load_pk_bloom_filter() { // for BE UT "segment_cache_test" return _load_pk_bf_once.call([this] { _meta_mem_usage += 100; + update_metadata_size(); return Status::OK(); }); } @@ -955,7 +966,7 @@ Status Segment::lookup_row_key(const Slice& key, const TabletSchema* latest_sche std::string* encoded_seq_value, OlapReaderStatistics* stats) { RETURN_IF_ERROR(load_pk_index_and_bf()); bool has_seq_col = latest_schema->has_sequence_col(); - bool has_rowid = !latest_schema->cluster_key_idxes().empty(); + bool has_rowid = !latest_schema->cluster_key_uids().empty(); size_t seq_col_length = 0; if (has_seq_col) { seq_col_length = latest_schema->column(latest_schema->sequence_col_idx()).length() + 1; @@ -1065,7 +1076,7 @@ Status Segment::read_key_by_rowid(uint32_t row_id, std::string* key) { RETURN_IF_ERROR(iter->next_batch(&num_read, index_column)); CHECK(num_read == 1); // trim row id - if (_tablet_schema->cluster_key_idxes().empty()) { + if (_tablet_schema->cluster_key_uids().empty()) { *key = index_column->get_data_at(0).to_string(); } else { Slice sought_key = diff --git a/be/src/olap/rowset/segment_v2/segment.h 
b/be/src/olap/rowset/segment_v2/segment.h index bc5ab1e1fdc80a..1b20c1f066bdf9 100644 --- a/be/src/olap/rowset/segment_v2/segment.h +++ b/be/src/olap/rowset/segment_v2/segment.h @@ -57,7 +57,6 @@ class IDataType; class ShortKeyIndexDecoder; class Schema; class StorageReadOptions; -class MemTracker; class PrimaryKeyIndexReader; class RowwiseIterator; struct RowLocation; @@ -93,6 +92,7 @@ class Segment : public std::enable_shared_from_this, public MetadataAdd ~Segment(); int64_t get_metadata_size() const override; + void update_metadata_size(); Status new_iterator(SchemaSPtr schema, const StorageReadOptions& read_options, std::unique_ptr* iter); @@ -163,6 +163,8 @@ class Segment : public std::enable_shared_from_this, public MetadataAdd io::FileReaderSPtr file_reader() { return _file_reader; } + // Including the column reader memory. + // another method `get_metadata_size` not include the column reader, only the segment object itself. int64_t meta_mem_usage() const { return _meta_mem_usage; } // Identify the column by unique id or path info @@ -249,9 +251,8 @@ class Segment : public std::enable_shared_from_this, public MetadataAdd // 1. Tracking memory use by segment meta data such as footer or index page. // 2. Tracking memory use by segment column reader // The memory consumed by querying is tracked in segment iterator. - // TODO: Segment::_meta_mem_usage Unknown value overflow, causes the value of SegmentMeta mem tracker - // is similar to `-2912341218700198079`. So, temporarily put it in experimental type tracker. 
int64_t _meta_mem_usage; + int64_t _tracked_meta_mem_usage = 0; RowsetId _rowset_id; TabletSchemaSPtr _tablet_schema; diff --git a/be/src/olap/rowset/segment_v2/segment_iterator.cpp b/be/src/olap/rowset/segment_v2/segment_iterator.cpp index 4ee73547c117e9..abdf9116756f0e 100644 --- a/be/src/olap/rowset/segment_v2/segment_iterator.cpp +++ b/be/src/olap/rowset/segment_v2/segment_iterator.cpp @@ -377,7 +377,7 @@ Status SegmentIterator::_lazy_init() { _row_bitmap.addRange(0, _segment->num_rows()); // z-order can not use prefix index if (_segment->_tablet_schema->sort_type() != SortType::ZORDER && - _segment->_tablet_schema->cluster_key_idxes().empty()) { + _segment->_tablet_schema->cluster_key_uids().empty()) { RETURN_IF_ERROR(_get_row_ranges_by_keys()); } RETURN_IF_ERROR(_get_row_ranges_by_column_conditions()); @@ -1193,7 +1193,7 @@ Status SegmentIterator::_lookup_ordinal_from_pk_index(const RowCursor& key, bool bool has_seq_col = _segment->_tablet_schema->has_sequence_col(); // Used to get key range from primary key index, // for mow with cluster key table, we should get key range from short key index. 
- DCHECK(_segment->_tablet_schema->cluster_key_idxes().empty()); + DCHECK(_segment->_tablet_schema->cluster_key_uids().empty()); // if full key is exact_match, the primary key without sequence column should also the same if (has_seq_col && !exact_match) { @@ -2175,11 +2175,11 @@ Status SegmentIterator::_next_batch_internal(vectorized::Block* block) { if (block->rows() == 0) { vectorized::MutableColumnPtr col0 = std::move(*block->get_by_position(0).column).mutate(); - auto res_column = vectorized::ColumnString::create(); - res_column->insert_data("", 0); - auto col_const = vectorized::ColumnConst::create(std::move(res_column), - selected_size); - block->replace_by_position(0, std::move(col_const)); + auto tmp_indicator_col = + block->get_by_position(0) + .type->create_column_const_with_default_value( + selected_size); + block->replace_by_position(0, std::move(tmp_indicator_col)); _output_index_result_column_for_expr(_sel_rowid_idx.data(), selected_size, block); block->shrink_char_type_column_suffix_zero(_char_type_idx_no_0); diff --git a/be/src/olap/rowset/segment_v2/segment_writer.cpp b/be/src/olap/rowset/segment_v2/segment_writer.cpp index fc22c3570e52a2..fe465f98a2aad2 100644 --- a/be/src/olap/rowset/segment_v2/segment_writer.cpp +++ b/be/src/olap/rowset/segment_v2/segment_writer.cpp @@ -103,7 +103,7 @@ SegmentWriter::SegmentWriter(io::FileWriter* file_writer, uint32_t segment_id, << ", table_id=" << _tablet_schema->table_id() << ", num_key_columns=" << _num_sort_key_columns << ", num_short_key_columns=" << _num_short_key_columns - << ", cluster_key_columns=" << _tablet_schema->cluster_key_idxes().size(); + << ", cluster_key_columns=" << _tablet_schema->cluster_key_uids().size(); } for (size_t cid = 0; cid < _num_sort_key_columns; ++cid) { const auto& column = _tablet_schema->column(cid); @@ -125,8 +125,8 @@ SegmentWriter::SegmentWriter(io::FileWriter* file_writer, uint32_t segment_id, // cluster keys _key_coders.clear(); _key_index_size.clear(); - 
_num_sort_key_columns = _tablet_schema->cluster_key_idxes().size(); - for (auto cid : _tablet_schema->cluster_key_idxes()) { + _num_sort_key_columns = _tablet_schema->cluster_key_uids().size(); + for (auto cid : _tablet_schema->cluster_key_uids()) { const auto& column = _tablet_schema->column_by_uid(cid); _key_coders.push_back(get_key_coder(column.type())); _key_index_size.push_back(column.index_length()); @@ -545,6 +545,39 @@ Status SegmentWriter::probe_key_for_mow( return Status::OK(); } +Status SegmentWriter::partial_update_preconditions_check(size_t row_pos) { + if (!_is_mow()) { + auto msg = fmt::format( + "Can only do partial update on merge-on-write unique table, but found: " + "keys_type={}, _opts.enable_unique_key_merge_on_write={}, tablet_id={}", + _tablet_schema->keys_type(), _opts.enable_unique_key_merge_on_write, + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + if (_opts.rowset_ctx->partial_update_info == nullptr) { + auto msg = + fmt::format("partial_update_info should not be nullptr, please check, tablet_id={}", + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + if (!_opts.rowset_ctx->partial_update_info->is_fixed_partial_update()) { + auto msg = fmt::format( + "in fixed partial update code, but update_mode={}, please check, tablet_id={}", + _opts.rowset_ctx->partial_update_info->update_mode(), _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + if (row_pos != 0) { + auto msg = fmt::format("row_pos should be 0, but found {}, tablet_id={}", row_pos, + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + return Status::OK(); +} + // for partial update, we should do following steps to fill content of block: // 1. set block data to data convertor, and get all key_column's converted slice // 2. 
get pk of input block, and read missing columns @@ -562,11 +595,7 @@ Status SegmentWriter::append_block_with_partial_content(const vectorized::Block* block->columns(), _tablet_schema->num_key_columns(), _tablet_schema->num_columns())); } - DCHECK(_is_mow()); - - DCHECK(_opts.rowset_ctx->partial_update_info); - DCHECK(_opts.rowset_ctx->partial_update_info->is_fixed_partial_update()); - DCHECK(row_pos == 0); + RETURN_IF_ERROR(partial_update_preconditions_check(row_pos)); // find missing column cids const auto& missing_cids = _opts.rowset_ctx->partial_update_info->missing_cids; @@ -788,7 +817,7 @@ Status SegmentWriter::append_block(const vectorized::Block* block, size_t row_po seq_column, num_rows, true)); // 2. generate short key index (use cluster key) key_columns.clear(); - for (const auto& cid : _tablet_schema->cluster_key_idxes()) { + for (const auto& cid : _tablet_schema->cluster_key_uids()) { // find cluster key index in tablet schema auto cluster_key_index = _tablet_schema->field_index(cid); if (cluster_key_index == -1) { @@ -1016,6 +1045,18 @@ Status SegmentWriter::finalize_columns_index(uint64_t* index_size) { *index_size = _file_writer->bytes_appended() - index_start; if (_has_key) { if (_is_mow_with_cluster_key()) { + // 1. sort primary keys + std::sort(_primary_keys.begin(), _primary_keys.end()); + // 2. write primary keys index + std::string last_key; + for (const auto& key : _primary_keys) { + DCHECK(key.compare(last_key) > 0) + << "found duplicate key or key is not sorted! current key: " << key + << ", last key: " << last_key; + RETURN_IF_ERROR(_primary_key_index_builder->add_item(key)); + last_key = key; + } + RETURN_IF_ERROR(_write_short_key_index()); *index_size = _file_writer->bytes_appended() - index_start; RETURN_IF_ERROR(_write_primary_key_index()); @@ -1236,27 +1277,16 @@ Status SegmentWriter::_generate_primary_key_index( last_key = std::move(key); } } else { // mow table with cluster key - // 1. 
generate primary keys in memory - std::vector primary_keys; + // generate primary keys in memory for (uint32_t pos = 0; pos < num_rows; pos++) { std::string key = _full_encode_keys(primary_key_coders, primary_key_columns, pos); _maybe_invalid_row_cache(key); if (_tablet_schema->has_sequence_col()) { _encode_seq_column(seq_column, pos, &key); } - _encode_rowid(pos, &key); - primary_keys.emplace_back(std::move(key)); - } - // 2. sort primary keys - std::sort(primary_keys.begin(), primary_keys.end()); - // 3. write primary keys index - std::string last_key; - for (const auto& key : primary_keys) { - DCHECK(key.compare(last_key) > 0) - << "found duplicate key or key is not sorted! current key: " << key - << ", last key: " << last_key; - RETURN_IF_ERROR(_primary_key_index_builder->add_item(key)); - last_key = key; + _encode_rowid(pos + _num_rows_written, &key); + _primary_keys_size += key.size(); + _primary_keys.emplace_back(std::move(key)); } } return Status::OK(); @@ -1289,7 +1319,7 @@ inline bool SegmentWriter::_is_mow() { } inline bool SegmentWriter::_is_mow_with_cluster_key() { - return _is_mow() && !_tablet_schema->cluster_key_idxes().empty(); + return _is_mow() && !_tablet_schema->cluster_key_uids().empty(); } } // namespace segment_v2 } // namespace doris diff --git a/be/src/olap/rowset/segment_v2/segment_writer.h b/be/src/olap/rowset/segment_v2/segment_writer.h index 9a8af131087f92..60300383d7287d 100644 --- a/be/src/olap/rowset/segment_v2/segment_writer.h +++ b/be/src/olap/rowset/segment_v2/segment_writer.h @@ -105,6 +105,7 @@ class SegmentWriter { const std::function& found_cb, const std::function& not_found_cb, PartialUpdateStats& stats); + Status partial_update_preconditions_check(size_t row_pos); Status append_block_with_partial_content(const vectorized::Block* block, size_t row_pos, size_t num_rows); Status append_block_with_variant_subcolumns(vectorized::Block& data); @@ -155,6 +156,8 @@ class SegmentWriter { return Status::OK(); } + uint64_t 
primary_keys_size() const { return _primary_keys_size; } + private: DISALLOW_COPY_AND_ASSIGN(SegmentWriter); Status _create_column_writer(uint32_t cid, const TabletColumn& column, @@ -260,6 +263,8 @@ class SegmentWriter { std::map _rsid_to_rowset; // contains auto generated columns, should be nullptr if no variants's subcolumns TabletSchemaSPtr _flush_schema = nullptr; + std::vector _primary_keys; + uint64_t _primary_keys_size = 0; }; } // namespace segment_v2 diff --git a/be/src/olap/rowset/segment_v2/vertical_segment_writer.cpp b/be/src/olap/rowset/segment_v2/vertical_segment_writer.cpp index ce16e2d502b622..0846b0fc1186a8 100644 --- a/be/src/olap/rowset/segment_v2/vertical_segment_writer.cpp +++ b/be/src/olap/rowset/segment_v2/vertical_segment_writer.cpp @@ -109,7 +109,7 @@ VerticalSegmentWriter::VerticalSegmentWriter(io::FileWriter* file_writer, uint32 << ", table_id=" << _tablet_schema->table_id() << ", num_key_columns=" << _num_sort_key_columns << ", num_short_key_columns=" << _num_short_key_columns - << ", cluster_key_columns=" << _tablet_schema->cluster_key_idxes().size(); + << ", cluster_key_columns=" << _tablet_schema->cluster_key_uids().size(); } for (size_t cid = 0; cid < _num_sort_key_columns; ++cid) { const auto& column = _tablet_schema->column(cid); @@ -131,8 +131,8 @@ VerticalSegmentWriter::VerticalSegmentWriter(io::FileWriter* file_writer, uint32 // cluster keys _key_coders.clear(); _key_index_size.clear(); - _num_sort_key_columns = _tablet_schema->cluster_key_idxes().size(); - for (auto cid : _tablet_schema->cluster_key_idxes()) { + _num_sort_key_columns = _tablet_schema->cluster_key_uids().size(); + for (auto cid : _tablet_schema->cluster_key_uids()) { const auto& column = _tablet_schema->column_by_uid(cid); _key_coders.push_back(get_key_coder(column.type())); _key_index_size.push_back(column.index_length()); @@ -418,6 +418,51 @@ Status VerticalSegmentWriter::_probe_key_for_mow( return Status::OK(); } +Status 
VerticalSegmentWriter::_partial_update_preconditions_check(size_t row_pos, + bool is_flexible_update) { + if (!_is_mow()) { + auto msg = fmt::format( + "Can only do partial update on merge-on-write unique table, but found: " + "keys_type={}, _opts.enable_unique_key_merge_on_write={}, tablet_id={}", + _tablet_schema->keys_type(), _opts.enable_unique_key_merge_on_write, + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + if (_opts.rowset_ctx->partial_update_info == nullptr) { + auto msg = + fmt::format("partial_update_info should not be nullptr, please check, tablet_id={}", + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + if (!is_flexible_update) { + if (!_opts.rowset_ctx->partial_update_info->is_fixed_partial_update()) { + auto msg = fmt::format( + "in fixed partial update code, but update_mode={}, please check, tablet_id={}", + _opts.rowset_ctx->partial_update_info->update_mode(), _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + } else { + if (!_opts.rowset_ctx->partial_update_info->is_flexible_partial_update()) { + auto msg = fmt::format( + "in flexible partial update code, but update_mode={}, please check, " + "tablet_id={}", + _opts.rowset_ctx->partial_update_info->update_mode(), _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + } + if (row_pos != 0) { + auto msg = fmt::format("row_pos should be 0, but found {}, tablet_id={}", row_pos, + _tablet->tablet_id()); + DCHECK(false) << msg; + return Status::InternalError(msg); + } + return Status::OK(); +} + // for partial update, we should do following steps to fill content of block: // 1. set block data to data convertor, and get all key_column's converted slice // 2. get pk of input block, and read missing columns @@ -427,11 +472,7 @@ Status VerticalSegmentWriter::_probe_key_for_mow( // 3. 
set columns to data convertor and then write all columns Status VerticalSegmentWriter::_append_block_with_partial_content(RowsInBlock& data, vectorized::Block& full_block) { - DCHECK(_is_mow()); - DCHECK(_opts.rowset_ctx->partial_update_info != nullptr); - DCHECK(_opts.rowset_ctx->partial_update_info->is_fixed_partial_update()); - DCHECK(data.row_pos == 0); - + RETURN_IF_ERROR(_partial_update_preconditions_check(data.row_pos, false)); // create full block and fill with input columns full_block = _tablet_schema->create_block(); const auto& including_cids = _opts.rowset_ctx->partial_update_info->update_cids; @@ -580,10 +621,7 @@ Status VerticalSegmentWriter::_append_block_with_partial_content(RowsInBlock& da Status VerticalSegmentWriter::_append_block_with_flexible_partial_content( RowsInBlock& data, vectorized::Block& full_block) { - DCHECK(_is_mow()); - DCHECK(_opts.rowset_ctx->partial_update_info != nullptr); - DCHECK(_opts.rowset_ctx->partial_update_info->is_flexible_partial_update()); - DCHECK(data.row_pos == 0); + RETURN_IF_ERROR(_partial_update_preconditions_check(data.row_pos, true)); // data.block has the same schema with full_block DCHECK(data.block->columns() == _tablet_schema->num_columns()); @@ -1149,9 +1187,9 @@ Status VerticalSegmentWriter::write_batch() { } auto column_unique_id = _tablet_schema->column(cid).unique_id(); if (_is_mow_with_cluster_key() && - std::find(_tablet_schema->cluster_key_idxes().begin(), - _tablet_schema->cluster_key_idxes().end(), - column_unique_id) != _tablet_schema->cluster_key_idxes().end()) { + std::find(_tablet_schema->cluster_key_uids().begin(), + _tablet_schema->cluster_key_uids().end(), + column_unique_id) != _tablet_schema->cluster_key_uids().end()) { cid_to_column[column_unique_id] = column; } RETURN_IF_ERROR(_column_writers[cid]->append(column->get_nullmap(), column->get_data(), @@ -1213,7 +1251,7 @@ Status VerticalSegmentWriter::_generate_key_index( data.num_rows, true)); // 2. 
generate short key index (use cluster key) std::vector short_key_columns; - for (const auto& cid : _tablet_schema->cluster_key_idxes()) { + for (const auto& cid : _tablet_schema->cluster_key_uids()) { short_key_columns.push_back(cid_to_column[cid]); } RETURN_IF_ERROR(_generate_short_key_index(short_key_columns, data.num_rows, short_key_pos)); @@ -1572,7 +1610,7 @@ inline bool VerticalSegmentWriter::_is_mow() { } inline bool VerticalSegmentWriter::_is_mow_with_cluster_key() { - return _is_mow() && !_tablet_schema->cluster_key_idxes().empty(); + return _is_mow() && !_tablet_schema->cluster_key_uids().empty(); } } // namespace segment_v2 } // namespace doris diff --git a/be/src/olap/rowset/segment_v2/vertical_segment_writer.h b/be/src/olap/rowset/segment_v2/vertical_segment_writer.h index 951e9c2e2838c3..8cec6ed4d1abd6 100644 --- a/be/src/olap/rowset/segment_v2/vertical_segment_writer.h +++ b/be/src/olap/rowset/segment_v2/vertical_segment_writer.h @@ -175,6 +175,7 @@ class VerticalSegmentWriter { const std::function& found_cb, const std::function& not_found_cb, PartialUpdateStats& stats); + Status _partial_update_preconditions_check(size_t row_pos, bool is_flexible_update); Status _append_block_with_partial_content(RowsInBlock& data, vectorized::Block& full_block); Status _append_block_with_flexible_partial_content(RowsInBlock& data, vectorized::Block& full_block); diff --git a/be/src/olap/rowset/vertical_beta_rowset_writer.cpp b/be/src/olap/rowset/vertical_beta_rowset_writer.cpp index ee9bfd97745c9b..f493f21ac97fb7 100644 --- a/be/src/olap/rowset/vertical_beta_rowset_writer.cpp +++ b/be/src/olap/rowset/vertical_beta_rowset_writer.cpp @@ -72,10 +72,9 @@ Status VerticalBetaRowsetWriter::add_columns(const vectorized::Block* block, _cur_writer_idx = 0; RETURN_IF_ERROR(_segment_writers[_cur_writer_idx]->append_block(block, 0, num_rows)); } else if (is_key) { - // TODO for cluster key, always create new segment writer because the primary keys are - // sorted in 
SegmentWriter::_generate_primary_key_index, will cause too many segments if (_segment_writers[_cur_writer_idx]->num_rows_written() > max_rows_per_segment || - has_cluster_key) { + (has_cluster_key && _segment_writers[_cur_writer_idx]->primary_keys_size() > + config::mow_primary_key_index_max_size_in_memory)) { // segment is full, need flush columns and create new segment writer RETURN_IF_ERROR(_flush_columns(_segment_writers[_cur_writer_idx].get(), true)); @@ -181,6 +180,7 @@ Status VerticalBetaRowsetWriter::_create_segment_writer( writer_options.enable_unique_key_merge_on_write = context.enable_unique_key_merge_on_write; writer_options.rowset_ctx = &context; writer_options.max_rows_per_segment = context.max_rows_per_segment; + // TODO if support VerticalSegmentWriter, also need to handle cluster key primary key index *writer = std::make_unique( segment_file_writer.get(), seg_id, context.tablet_schema, context.tablet, context.data_dir, writer_options, inverted_index_file_writer.get()); diff --git a/be/src/olap/rowset_builder.h b/be/src/olap/rowset_builder.h index 7fd578037363a0..fb2294d1770cc4 100644 --- a/be/src/olap/rowset_builder.h +++ b/be/src/olap/rowset_builder.h @@ -38,7 +38,6 @@ namespace doris { class CalcDeleteBitmapToken; class FlushToken; class MemTable; -class MemTracker; class StorageEngine; class TupleDescriptor; class SlotDescriptor; diff --git a/be/src/olap/schema_change.cpp b/be/src/olap/schema_change.cpp index ec291d8d2f0068..cdb637b1c42647 100644 --- a/be/src/olap/schema_change.cpp +++ b/be/src/olap/schema_change.cpp @@ -198,6 +198,21 @@ class MultiBlockMerger { pushed_row_refs.push_back(row_refs[i]); } } + if (!_tablet->tablet_schema()->cluster_key_uids().empty()) { + std::vector ids; + for (const auto& cid : _tablet->tablet_schema()->cluster_key_uids()) { + auto index = _tablet->tablet_schema()->field_index(cid); + if (index == -1) { + return Status::InternalError( + "could not find cluster key column with unique_id=" + + std::to_string(cid) + 
" in tablet schema"); + } + ids.push_back(index); + } + // sort by cluster key + std::stable_sort(pushed_row_refs.begin(), pushed_row_refs.end(), + ClusterKeyRowRefComparator(ids)); + } } // update real inserted row number @@ -249,6 +264,20 @@ class MultiBlockMerger { const size_t _num_columns; }; + struct ClusterKeyRowRefComparator { + ClusterKeyRowRefComparator(std::vector columns) : _columns(columns) {} + + int compare(const RowRef& lhs, const RowRef& rhs) const { + return lhs.block->compare_at(lhs.position, rhs.position, &_columns, *rhs.block, -1); + } + + bool operator()(const RowRef& lhs, const RowRef& rhs) const { + return compare(lhs, rhs) < 0; + } + + const std::vector _columns; + }; + BaseTabletSPtr _tablet; RowRefComparator _cmp; vectorized::Arena _arena; @@ -1158,6 +1187,7 @@ Status SchemaChangeJob::_convert_historical_rowsets(const SchemaChangeParams& sc } context.write_type = DataWriteType::TYPE_SCHEMA_CHANGE; + // TODO if support VerticalSegmentWriter, also need to handle cluster key primary key index auto result = _new_tablet->create_rowset_writer(context, false); if (!result.has_value()) { res = Status::Error("create_rowset_writer failed, reason={}", diff --git a/be/src/olap/segment_loader.cpp b/be/src/olap/segment_loader.cpp index 26ac54c699b81a..4240f7e250a06b 100644 --- a/be/src/olap/segment_loader.cpp +++ b/be/src/olap/segment_loader.cpp @@ -77,9 +77,8 @@ Status SegmentLoader::load_segments(const BetaRowsetSharedPtr& rowset, } if (use_cache && !config::disable_segment_cache) { // memory of SegmentCache::CacheValue will be handled by SegmentCache - auto* cache_value = new SegmentCache::CacheValue(); + auto* cache_value = new SegmentCache::CacheValue(segment); _cache_mem_usage += segment->meta_mem_usage(); - cache_value->segment = std::move(segment); _segment_cache->insert(cache_key, *cache_value, cache_handle); } else { cache_handle->push_segment(std::move(segment)); diff --git a/be/src/olap/segment_loader.h b/be/src/olap/segment_loader.h index 
834906da93bf74..2c5b1ed200dde7 100644 --- a/be/src/olap/segment_loader.h +++ b/be/src/olap/segment_loader.h @@ -75,9 +75,9 @@ class SegmentCache : public LRUCachePolicy { // Holding all opened segments of a rowset. class CacheValue : public LRUCacheValueBase { public: - ~CacheValue() override { segment.reset(); } + CacheValue(segment_v2::SegmentSharedPtr segment_) : segment(std::move(segment_)) {} - segment_v2::SegmentSharedPtr segment; + const segment_v2::SegmentSharedPtr segment; }; SegmentCache(size_t memory_bytes_limit, size_t segment_num_limit) @@ -124,8 +124,13 @@ class SegmentLoader { void erase_segments(const RowsetId& rowset_id, int64_t num_segments); - // Just used for BE UT - int64_t cache_mem_usage() const { return _cache_mem_usage; } + int64_t cache_mem_usage() const { +#ifdef BE_TEST + return _cache_mem_usage; +#else + return _segment_cache->value_mem_consumption(); +#endif + } private: SegmentLoader(); diff --git a/be/src/olap/tablet.cpp b/be/src/olap/tablet.cpp index 0d04984d0e06ba..379fb6eec3cb43 100644 --- a/be/src/olap/tablet.cpp +++ b/be/src/olap/tablet.cpp @@ -1692,6 +1692,10 @@ void Tablet::build_tablet_report_info(TTabletInfo* tablet_info, // tablet may not have cooldowned data, but the storage policy is set tablet_info->__set_cooldown_term(_cooldown_conf.term); } + tablet_info->__set_local_index_size(_tablet_meta->tablet_local_index_size()); + tablet_info->__set_local_segment_size(_tablet_meta->tablet_local_segment_size()); + tablet_info->__set_remote_index_size(_tablet_meta->tablet_remote_index_size()); + tablet_info->__set_remote_segment_size(_tablet_meta->tablet_remote_segment_size()); } void Tablet::report_error(const Status& st) { diff --git a/be/src/olap/tablet_manager.cpp b/be/src/olap/tablet_manager.cpp index d6a944dbc39853..33fee7ca350900 100644 --- a/be/src/olap/tablet_manager.cpp +++ b/be/src/olap/tablet_manager.cpp @@ -57,8 +57,6 @@ #include "olap/tablet_schema.h" #include "olap/txn_manager.h" #include "runtime/exec_env.h" 
-#include "runtime/memory/mem_tracker.h" -#include "runtime/thread_context.h" #include "service/backend_options.h" #include "util/defer_op.h" #include "util/doris_metrics.h" @@ -83,28 +81,18 @@ using std::vector; namespace doris { using namespace ErrorCode; -DEFINE_GAUGE_METRIC_PROTOTYPE_5ARG(tablet_meta_mem_consumption, MetricUnit::BYTES, "", - mem_consumption, Labels({{"type", "tablet_meta"}})); - bvar::Adder g_tablet_meta_schema_columns_count("tablet_meta_schema_columns_count"); TabletManager::TabletManager(StorageEngine& engine, int32_t tablet_map_lock_shard_size) : _engine(engine), - _tablet_meta_mem_tracker(std::make_shared("TabletMeta(experimental)")), _tablets_shards_size(tablet_map_lock_shard_size), _tablets_shards_mask(tablet_map_lock_shard_size - 1) { CHECK_GT(_tablets_shards_size, 0); CHECK_EQ(_tablets_shards_size & _tablets_shards_mask, 0); _tablets_shards.resize(_tablets_shards_size); - REGISTER_HOOK_METRIC(tablet_meta_mem_consumption, - [this]() { return _tablet_meta_mem_tracker->consumption(); }); } -TabletManager::~TabletManager() { -#ifndef BE_TEST - DEREGISTER_HOOK_METRIC(tablet_meta_mem_consumption); -#endif -} +TabletManager::~TabletManager() = default; Status TabletManager::_add_tablet_unlocked(TTabletId tablet_id, const TabletSharedPtr& tablet, bool update_meta, bool force, RuntimeProfile* profile) { @@ -242,10 +230,6 @@ Status TabletManager::_add_tablet_to_map_unlocked(TTabletId tablet_id, tablet_map_t& tablet_map = _get_tablet_map(tablet_id); tablet_map[tablet_id] = tablet; _add_tablet_to_partition(tablet); - // TODO: remove multiply 2 of tablet meta mem size - // Because table schema will copy in tablet, there will be double mem cost - // so here multiply 2 - _tablet_meta_mem_tracker->consume(tablet->tablet_meta()->mem_size() * 2); g_tablet_meta_schema_columns_count << tablet->tablet_meta()->tablet_columns_num(); COUNTER_UPDATE(ADD_CHILD_TIMER(profile, "RegisterTabletInfo", "AddTablet"), static_cast(watch.reset())); @@ -599,7 +583,6 @@ 
Status TabletManager::_drop_tablet(TTabletId tablet_id, TReplicaId replica_id, b } to_drop_tablet->deregister_tablet_from_dir(); - _tablet_meta_mem_tracker->release(to_drop_tablet->tablet_meta()->mem_size() * 2); g_tablet_meta_schema_columns_count << -to_drop_tablet->tablet_meta()->tablet_columns_num(); return Status::OK(); } @@ -1083,6 +1066,10 @@ void TabletManager::build_all_report_tablets_info(std::map* t_tablet_stat.__set_total_version_count(tablet_info.total_version_count); t_tablet_stat.__set_visible_version_count(tablet_info.visible_version_count); t_tablet_stat.__set_visible_version(tablet_info.version); + t_tablet_stat.__set_local_index_size(tablet_info.local_index_size); + t_tablet_stat.__set_local_segment_size(tablet_info.local_segment_size); + t_tablet_stat.__set_remote_index_size(tablet_info.remote_index_size); + t_tablet_stat.__set_remote_segment_size(tablet_info.remote_segment_size); }; for_each_tablet(handler, filter_all_tablets); @@ -1183,14 +1170,14 @@ bool TabletManager::_move_tablet_to_trash(const TabletSharedPtr& tablet) { if (tablet_in_not_shutdown->tablet_path() != tablet->tablet_path()) { LOG(INFO) << "tablet path not eq shutdown tablet path, move it to trash, tablet_id=" << tablet_in_not_shutdown->tablet_id() - << " mem manager tablet path=" << tablet_in_not_shutdown->tablet_path() - << " shutdown tablet path=" << tablet->tablet_path(); + << ", mem manager tablet path=" << tablet_in_not_shutdown->tablet_path() + << ", shutdown tablet path=" << tablet->tablet_path(); return tablet->data_dir()->move_to_trash(tablet->tablet_path()); } else { LOG(INFO) << "tablet path eq shutdown tablet path, not move to trash, tablet_id=" << tablet_in_not_shutdown->tablet_id() - << " mem manager tablet path=" << tablet_in_not_shutdown->tablet_path() - << " shutdown tablet path=" << tablet->tablet_path(); + << ", mem manager tablet path=" << tablet_in_not_shutdown->tablet_path() + << ", shutdown tablet path=" << tablet->tablet_path(); return true; } } @@ 
-1295,7 +1282,7 @@ Status TabletManager::register_transition_tablet(int64_t tablet_id, std::string // not found shard.tablets_under_transition[tablet_id] = std::make_tuple(reason, thread_id, 1); LOG(INFO) << "add tablet_id= " << tablet_id << " to map, reason=" << reason - << " lock times=1 thread_id_in_map=" << thread_id; + << ", lock times=1, thread_id_in_map=" << thread_id; return Status::OK(); } else { // found @@ -1303,15 +1290,15 @@ Status TabletManager::register_transition_tablet(int64_t tablet_id, std::string if (thread_id != thread_id_in_map) { // other thread, failed LOG(INFO) << "tablet_id = " << tablet_id << " is doing " << r - << " thread_id_in_map=" << thread_id_in_map << " , add reason=" << reason - << " thread_id=" << thread_id; + << ", thread_id_in_map=" << thread_id_in_map << " , add reason=" << reason + << ", thread_id=" << thread_id; return Status::InternalError("{} failed try later, tablet_id={}", reason, tablet_id); } // add lock times ++lock_times; LOG(INFO) << "add tablet_id= " << tablet_id << " to map, reason=" << reason - << " lock times=" << lock_times << " thread_id_in_map=" << thread_id_in_map; + << ", lock times=" << lock_times << ", thread_id_in_map=" << thread_id_in_map; return Status::OK(); } } @@ -1335,10 +1322,10 @@ void TabletManager::unregister_transition_tablet(int64_t tablet_id, std::string --lock_times; if (lock_times != 0) { LOG(INFO) << "erase tablet_id= " << tablet_id << " from map, reason=" << reason - << " left=" << lock_times << " thread_id_in_map=" << thread_id_in_map; + << ", left=" << lock_times << ", thread_id_in_map=" << thread_id_in_map; } else { LOG(INFO) << "erase tablet_id= " << tablet_id << " from map, reason=" << reason - << " thread_id_in_map=" << thread_id_in_map; + << ", thread_id_in_map=" << thread_id_in_map; shard.tablets_under_transition.erase(tablet_id); } } diff --git a/be/src/olap/tablet_manager.h b/be/src/olap/tablet_manager.h index 42623cf05f2aea..6b6e7998f9cee1 100644 --- 
a/be/src/olap/tablet_manager.h +++ b/be/src/olap/tablet_manager.h @@ -251,9 +251,6 @@ class TabletManager { StorageEngine& _engine; - // TODO: memory size of TabletSchema cannot be accurately tracked. - std::shared_ptr _tablet_meta_mem_tracker; - const int32_t _tablets_shards_size; const int32_t _tablets_shards_mask; std::vector _tablets_shards; diff --git a/be/src/olap/tablet_meta.cpp b/be/src/olap/tablet_meta.cpp index 0570aff349c583..3247f34656fb5d 100644 --- a/be/src/olap/tablet_meta.cpp +++ b/be/src/olap/tablet_meta.cpp @@ -57,6 +57,7 @@ using std::unordered_map; using std::vector; namespace doris { +#include "common/compile_check_begin.h" using namespace ErrorCode; TabletMetaSharedPtr TabletMeta::create( @@ -106,7 +107,7 @@ TabletMeta::TabletMeta() _delete_bitmap(new DeleteBitmap(_tablet_id)) {} TabletMeta::TabletMeta(int64_t table_id, int64_t partition_id, int64_t tablet_id, - int64_t replica_id, int32_t schema_hash, uint64_t shard_id, + int64_t replica_id, int32_t schema_hash, int32_t shard_id, const TTabletSchema& tablet_schema, uint32_t next_unique_id, const std::unordered_map& col_ordinal_to_unique_id, TabletUid tablet_uid, TTabletType::type tabletType, @@ -203,6 +204,9 @@ TabletMeta::TabletMeta(int64_t table_id, int64_t partition_id, int64_t tablet_id case TInvertedIndexFileStorageFormat::V2: schema->set_inverted_index_storage_format(InvertedIndexStorageFormatPB::V2); break; + case TInvertedIndexFileStorageFormat::V3: + schema->set_inverted_index_storage_format(InvertedIndexStorageFormatPB::V3); + break; default: schema->set_inverted_index_storage_format(InvertedIndexStorageFormatPB::V2); break; @@ -216,8 +220,8 @@ TabletMeta::TabletMeta(int64_t table_id, int64_t partition_id, int64_t tablet_id schema->set_sort_type(SortType::LEXICAL); } schema->set_sort_col_num(tablet_schema.sort_col_num); - for (const auto& i : tablet_schema.cluster_key_idxes) { - schema->add_cluster_key_idxes(i); + for (const auto& i : tablet_schema.cluster_key_uids) { + 
schema->add_cluster_key_uids(i); } tablet_meta_pb.set_in_restore_mode(false); @@ -571,7 +575,8 @@ void TabletMeta::serialize(string* meta_binary) { Status TabletMeta::deserialize(std::string_view meta_binary) { TabletMetaPB tablet_meta_pb; - bool parsed = tablet_meta_pb.ParseFromArray(meta_binary.data(), meta_binary.size()); + bool parsed = tablet_meta_pb.ParseFromArray(meta_binary.data(), + static_cast(meta_binary.size())); if (!parsed) { return Status::Error("parse tablet meta failed"); } @@ -664,7 +669,7 @@ void TabletMeta::init_from_pb(const TabletMetaPB& tablet_meta_pb) { int seg_maps_size = tablet_meta_pb.delete_bitmap().segment_delete_bitmaps_size(); CHECK(rst_ids_size == seg_ids_size && seg_ids_size == seg_maps_size && seg_maps_size == versions_size); - for (size_t i = 0; i < rst_ids_size; ++i) { + for (int i = 0; i < rst_ids_size; ++i) { RowsetId rst_id; rst_id.init(tablet_meta_pb.delete_bitmap().rowset_ids(i)); auto seg_id = tablet_meta_pb.delete_bitmap().segment_ids(i); @@ -781,12 +786,6 @@ void TabletMeta::to_meta_pb(TabletMetaPB* tablet_meta_pb) { time_series_compaction_level_threshold()); } -int64_t TabletMeta::mem_size() const { - auto size = sizeof(TabletMeta); - size += _schema->mem_size(); - return size; -} - void TabletMeta::to_json(string* json_string, json2pb::Pb2JsonOptions& options) { TabletMetaPB tablet_meta_pb; to_meta_pb(&tablet_meta_pb); @@ -1312,4 +1311,5 @@ std::string tablet_state_name(TabletState state) { } } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/olap/tablet_meta.h b/be/src/olap/tablet_meta.h index fb0895604a19fe..25f6bcd569be43 100644 --- a/be/src/olap/tablet_meta.h +++ b/be/src/olap/tablet_meta.h @@ -51,6 +51,7 @@ #include "util/uid_util.h" namespace json2pb { +#include "common/compile_check_begin.h" struct Pb2JsonOptions; } // namespace json2pb @@ -100,7 +101,7 @@ class TabletMeta : public MetadataAdder { TabletMeta(); TabletMeta(int64_t table_id, int64_t partition_id, int64_t tablet_id, 
int64_t replica_id, - int32_t schema_hash, uint64_t shard_id, const TTabletSchema& tablet_schema, + int32_t schema_hash, int32_t shard_id, const TTabletSchema& tablet_schema, uint32_t next_unique_id, const std::unordered_map& col_ordinal_to_unique_id, TabletUid tablet_uid, TTabletType::type tabletType, @@ -140,10 +141,6 @@ class TabletMeta : public MetadataAdder { void to_meta_pb(TabletMetaPB* tablet_meta_pb); void to_json(std::string* json_string, json2pb::Pb2JsonOptions& options); - // Don't use. - // TODO: memory size of TabletSchema cannot be accurately tracked. - // In some places, temporarily use num_columns() as TabletSchema size. - int64_t mem_size() const; size_t tablet_columns_num() const { return _schema->num_columns(); } TabletTypePB tablet_type() const { return _tablet_type; } @@ -156,7 +153,7 @@ class TabletMeta : public MetadataAdder { int64_t replica_id() const; void set_replica_id(int64_t replica_id) { _replica_id = replica_id; } int32_t schema_hash() const; - int16_t shard_id() const; + int32_t shard_id() const; void set_shard_id(int32_t shard_id); int64_t creation_time() const; void set_creation_time(int64_t creation_time); @@ -170,6 +167,12 @@ class TabletMeta : public MetadataAdder { size_t tablet_local_size() const; // Remote disk space occupied by tablet. 
size_t tablet_remote_size() const; + + size_t tablet_local_index_size() const; + size_t tablet_local_segment_size() const; + size_t tablet_remote_index_size() const; + size_t tablet_remote_segment_size() const; + size_t version_count() const; size_t stale_version_count() const; size_t version_count_cross_with_range(const Version& range) const; @@ -608,7 +611,7 @@ inline int32_t TabletMeta::schema_hash() const { return _schema_hash; } -inline int16_t TabletMeta::shard_id() const { +inline int32_t TabletMeta::shard_id() const { return _shard_id; } @@ -668,6 +671,46 @@ inline size_t TabletMeta::tablet_remote_size() const { return total_size; } +inline size_t TabletMeta::tablet_local_index_size() const { + size_t total_size = 0; + for (auto& rs : _rs_metas) { + if (rs->is_local()) { + total_size += rs->index_disk_size(); + } + } + return total_size; +} + +inline size_t TabletMeta::tablet_local_segment_size() const { + size_t total_size = 0; + for (auto& rs : _rs_metas) { + if (rs->is_local()) { + total_size += rs->data_disk_size(); + } + } + return total_size; +} + +inline size_t TabletMeta::tablet_remote_index_size() const { + size_t total_size = 0; + for (auto& rs : _rs_metas) { + if (!rs->is_local()) { + total_size += rs->index_disk_size(); + } + } + return total_size; +} + +inline size_t TabletMeta::tablet_remote_segment_size() const { + size_t total_size = 0; + for (auto& rs : _rs_metas) { + if (!rs->is_local()) { + total_size += rs->data_disk_size(); + } + } + return total_size; +} + inline size_t TabletMeta::version_count() const { return _rs_metas.size(); } @@ -732,4 +775,5 @@ std::string tablet_state_name(TabletState state); bool operator==(const TabletMeta& a, const TabletMeta& b); bool operator!=(const TabletMeta& a, const TabletMeta& b); +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/olap/tablet_meta_manager.cpp b/be/src/olap/tablet_meta_manager.cpp index 6f27dd4db4e672..7c08d7856200f9 100644 --- 
a/be/src/olap/tablet_meta_manager.cpp +++ b/be/src/olap/tablet_meta_manager.cpp @@ -291,8 +291,7 @@ Status TabletMetaManager::remove_old_version_delete_bitmap(DataDir* store, TTabl return true; }; LOG(INFO) << "remove old version delete bitmap, tablet_id: " << tablet_id - << " version: " << version << " removed keys size: " << remove_keys.size(); - ; + << " version: " << version << ", removed keys size: " << remove_keys.size(); RETURN_IF_ERROR(meta->iterate(META_COLUMN_FAMILY_INDEX, begin_key, get_remove_keys_func)); return meta->remove(META_COLUMN_FAMILY_INDEX, remove_keys); } diff --git a/be/src/olap/tablet_reader.cpp b/be/src/olap/tablet_reader.cpp index 7410b70f4aa471..a83e0bfdbf4c30 100644 --- a/be/src/olap/tablet_reader.cpp +++ b/be/src/olap/tablet_reader.cpp @@ -464,13 +464,39 @@ Status TabletReader::_init_orderby_keys_param(const ReaderParams& read_params) { // UNIQUE_KEYS will compare all keys as before if (_tablet_schema->keys_type() == DUP_KEYS || (_tablet_schema->keys_type() == UNIQUE_KEYS && _tablet->enable_unique_key_merge_on_write())) { - // find index in vector _return_columns - // for the read_orderby_key_num_prefix_columns orderby keys - for (uint32_t i = 0; i < read_params.read_orderby_key_num_prefix_columns; i++) { - for (uint32_t idx = 0; idx < _return_columns.size(); idx++) { - if (_return_columns[idx] == i) { - _orderby_key_columns.push_back(idx); - break; + if (!_tablet_schema->cluster_key_uids().empty()) { + if (read_params.read_orderby_key_num_prefix_columns > + _tablet_schema->cluster_key_uids().size()) { + return Status::Error( + "read_orderby_key_num_prefix_columns={} > cluster_keys.size()={}", + read_params.read_orderby_key_num_prefix_columns, + _tablet_schema->cluster_key_uids().size()); + } + for (uint32_t i = 0; i < read_params.read_orderby_key_num_prefix_columns; i++) { + auto cid = _tablet_schema->cluster_key_uids()[i]; + auto index = _tablet_schema->field_index(cid); + if (index < 0) { + return Status::Error( + "could not find 
cluster key column with unique_id=" + + std::to_string(cid) + + " in tablet schema, tablet_id=" + std::to_string(_tablet->tablet_id())); + } + for (uint32_t idx = 0; idx < _return_columns.size(); idx++) { + if (_return_columns[idx] == index) { + _orderby_key_columns.push_back(idx); + break; + } + } + } + } else { + // find index in vector _return_columns + // for the read_orderby_key_num_prefix_columns orderby keys + for (uint32_t i = 0; i < read_params.read_orderby_key_num_prefix_columns; i++) { + for (uint32_t idx = 0; idx < _return_columns.size(); idx++) { + if (_return_columns[idx] == i) { + _orderby_key_columns.push_back(idx); + break; + } } } } @@ -579,8 +605,7 @@ ColumnPredicate* TabletReader::_parse_to_predicate( return nullptr; } const TabletColumn& column = materialize_column(_tablet_schema->column(index)); - return create_column_predicate(index, bloom_filter.second, column.type(), - _reader_context.runtime_state->be_exec_version(), &column); + return create_column_predicate(index, bloom_filter.second, column.type(), &column); } ColumnPredicate* TabletReader::_parse_to_predicate( @@ -590,8 +615,7 @@ ColumnPredicate* TabletReader::_parse_to_predicate( return nullptr; } const TabletColumn& column = materialize_column(_tablet_schema->column(index)); - return create_column_predicate(index, in_filter.second, column.type(), - _reader_context.runtime_state->be_exec_version(), &column); + return create_column_predicate(index, in_filter.second, column.type(), &column); } ColumnPredicate* TabletReader::_parse_to_predicate( @@ -601,8 +625,7 @@ ColumnPredicate* TabletReader::_parse_to_predicate( return nullptr; } const TabletColumn& column = materialize_column(_tablet_schema->column(index)); - return create_column_predicate(index, bitmap_filter.second, column.type(), - _reader_context.runtime_state->be_exec_version(), &column); + return create_column_predicate(index, bitmap_filter.second, column.type(), &column); } ColumnPredicate* 
TabletReader::_parse_to_predicate(const FunctionFilter& function_filter) { @@ -612,8 +635,7 @@ ColumnPredicate* TabletReader::_parse_to_predicate(const FunctionFilter& functio } const TabletColumn& column = materialize_column(_tablet_schema->column(index)); return create_column_predicate(index, std::make_shared(function_filter), - column.type(), _reader_context.runtime_state->be_exec_version(), - &column); + column.type(), &column); } Status TabletReader::_init_delete_condition(const ReaderParams& read_params) { diff --git a/be/src/olap/tablet_schema.cpp b/be/src/olap/tablet_schema.cpp index c4f96e2214853d..3ec5d22166477f 100644 --- a/be/src/olap/tablet_schema.cpp +++ b/be/src/olap/tablet_schema.cpp @@ -41,8 +41,6 @@ #include "olap/tablet_column_object_pool.h" #include "olap/types.h" #include "olap/utils.h" -#include "runtime/memory/lru_cache_policy.h" -#include "runtime/thread_context.h" #include "tablet_meta.h" #include "vec/aggregate_functions/aggregate_function_simple_factory.h" #include "vec/aggregate_functions/aggregate_function_state_union.h" @@ -975,10 +973,10 @@ void TabletSchema::init_from_pb(const TabletSchemaPB& schema, bool ignore_extrac _indexes.clear(); _field_name_to_index.clear(); _field_id_to_index.clear(); - _cluster_key_idxes.clear(); + _cluster_key_uids.clear(); clear_column_cache_handlers(); - for (const auto& i : schema.cluster_key_idxes()) { - _cluster_key_idxes.push_back(i); + for (const auto& i : schema.cluster_key_uids()) { + _cluster_key_uids.push_back(i); } for (auto& column_pb : schema.column()) { TabletColumnPtr column; @@ -1126,10 +1124,10 @@ void TabletSchema::build_current_tablet_schema(int64_t index_id, int32_t version _sequence_col_idx = -1; _version_col_idx = -1; _skip_bitmap_col_idx = -1; - _cluster_key_idxes.clear(); + _cluster_key_uids.clear(); clear_column_cache_handlers(); - for (const auto& i : ori_tablet_schema._cluster_key_idxes) { - _cluster_key_idxes.push_back(i); + for (const auto& i : 
ori_tablet_schema._cluster_key_uids) { + _cluster_key_uids.push_back(i); } for (auto& column : index->columns) { if (column->is_key()) { @@ -1237,8 +1235,8 @@ void TabletSchema::reserve_extracted_columns() { } void TabletSchema::to_schema_pb(TabletSchemaPB* tablet_schema_pb) const { - for (const auto& i : _cluster_key_idxes) { - tablet_schema_pb->add_cluster_key_idxes(i); + for (const auto& i : _cluster_key_uids) { + tablet_schema_pb->add_cluster_key_uids(i); } tablet_schema_pb->set_keys_type(_keys_type); for (const auto& col : _cols) { diff --git a/be/src/olap/tablet_schema.h b/be/src/olap/tablet_schema.h index 5fb3deafd77319..c813d6f0ef8722 100644 --- a/be/src/olap/tablet_schema.h +++ b/be/src/olap/tablet_schema.h @@ -332,10 +332,8 @@ class TabletSchema : public MetadataAdder { void copy_from(const TabletSchema& tablet_schema); void update_index_info_from(const TabletSchema& tablet_schema); std::string to_key() const; - // Don't use. - // TODO: memory size of TabletSchema cannot be accurately tracked. - // In some places, temporarily use num_columns() as TabletSchema size. - int64_t mem_size() const { return _mem_size; } + // get_metadata_size is only the memory of the TabletSchema itself, not include child objects. 
+ int64_t mem_size() const { return get_metadata_size(); } size_t row_size() const; int32_t field_index(const std::string& field_name) const; int32_t field_index(const vectorized::PathInData& path) const; @@ -351,7 +349,7 @@ class TabletSchema : public MetadataAdder { const std::vector& columns() const; size_t num_columns() const { return _num_columns; } size_t num_key_columns() const { return _num_key_columns; } - const std::vector& cluster_key_idxes() const { return _cluster_key_idxes; } + const std::vector& cluster_key_uids() const { return _cluster_key_uids; } size_t num_null_columns() const { return _num_null_columns; } size_t num_short_key_columns() const { return _num_short_key_columns; } size_t num_rows_per_row_block() const { return _num_rows_per_row_block; } @@ -550,7 +548,7 @@ class TabletSchema : public MetadataAdder { size_t _num_columns = 0; size_t _num_variant_columns = 0; size_t _num_key_columns = 0; - std::vector _cluster_key_idxes; + std::vector _cluster_key_uids; size_t _num_null_columns = 0; size_t _num_short_key_columns = 0; size_t _num_rows_per_row_block = 0; @@ -573,7 +571,6 @@ class TabletSchema : public MetadataAdder { int64_t _db_id = -1; bool _disable_auto_compaction = false; bool _enable_single_replica_compaction = false; - int64_t _mem_size = 0; bool _store_row_column = false; bool _skip_write_index_on_load = false; InvertedIndexStorageFormatPB _inverted_index_storage_format = InvertedIndexStorageFormatPB::V1; diff --git a/be/src/olap/tablet_schema_cache.cpp b/be/src/olap/tablet_schema_cache.cpp index fd238fa5affb3f..e044ef9c0426f4 100644 --- a/be/src/olap/tablet_schema_cache.cpp +++ b/be/src/olap/tablet_schema_cache.cpp @@ -56,7 +56,7 @@ std::pair TabletSchemaCache::insert(const std: tablet_schema_ptr->init_from_pb(pb, false, true); value->tablet_schema = tablet_schema_ptr; lru_handle = LRUCachePolicy::insert(key_signature, value, tablet_schema_ptr->num_columns(), - 0, CachePriority::NORMAL); + tablet_schema_ptr->mem_size(), 
CachePriority::NORMAL); g_tablet_schema_cache_count << 1; g_tablet_schema_cache_columns_count << tablet_schema_ptr->num_columns(); } diff --git a/be/src/pipeline/dependency.h b/be/src/pipeline/dependency.h index f7712625d3e9a6..ad018c8b4f8f3d 100644 --- a/be/src/pipeline/dependency.h +++ b/be/src/pipeline/dependency.h @@ -34,6 +34,7 @@ #include "pipeline/common/set_utils.h" #include "pipeline/exec/data_queue.h" #include "pipeline/exec/join/process_hash_table_probe.h" +#include "util/stack_util.h" #include "vec/common/sort/partition_sorter.h" #include "vec/common/sort/sorter.h" #include "vec/core/block.h" @@ -107,7 +108,7 @@ class Dependency : public std::enable_shared_from_this { // Which dependency current pipeline task is blocked by. `nullptr` if this dependency is ready. [[nodiscard]] virtual Dependency* is_blocked_by(PipelineTask* task = nullptr); // Notify downstream pipeline tasks this dependency is ready. - void set_ready(); + virtual void set_ready(); void set_ready_to_read() { DCHECK_EQ(_shared_state->source_deps.size(), 1) << debug_string(); _shared_state->source_deps.front()->set_ready(); diff --git a/be/src/pipeline/exec/hashjoin_build_sink.cpp b/be/src/pipeline/exec/hashjoin_build_sink.cpp index cec0c77da8a61d..b2a79a941f79e7 100644 --- a/be/src/pipeline/exec/hashjoin_build_sink.cpp +++ b/be/src/pipeline/exec/hashjoin_build_sink.cpp @@ -91,8 +91,8 @@ Status HashJoinBuildSinkLocalState::init(RuntimeState* state, LocalSinkStateInfo RETURN_IF_ERROR(_hash_table_init(state)); _runtime_filters.resize(p._runtime_filter_descs.size()); for (size_t i = 0; i < p._runtime_filter_descs.size(); i++) { - RETURN_IF_ERROR(state->register_producer_runtime_filter( - p._runtime_filter_descs[i], &_runtime_filters[i], _build_expr_ctxs.size() == 1)); + RETURN_IF_ERROR(state->register_producer_runtime_filter(p._runtime_filter_descs[i], + &_runtime_filters[i])); } _runtime_filter_slots = @@ -139,35 +139,54 @@ Status HashJoinBuildSinkLocalState::close(RuntimeState* state, 
Status exec_statu return Base::close(state, exec_status); } - if (state->get_task()->wake_up_by_downstream()) { - if (_should_build_hash_table) { - // partitial ignore rf to make global rf work - RETURN_IF_ERROR(_runtime_filter_slots->send_filter_size(state, 0, _finish_dependency)); - RETURN_IF_ERROR(_runtime_filter_slots->ignore_all_filters()); + try { + if (state->get_task()->wake_up_by_downstream()) { + if (_should_build_hash_table) { + // partitial ignore rf to make global rf work + RETURN_IF_ERROR( + _runtime_filter_slots->send_filter_size(state, 0, _finish_dependency)); + RETURN_IF_ERROR(_runtime_filter_slots->ignore_all_filters()); + } else { + // do not publish filter coz local rf not inited and useless + return Base::close(state, exec_status); + } + } else if (_should_build_hash_table) { + if (p._shared_hashtable_controller && + !p._shared_hash_table_context->complete_build_stage) { + return Status::InternalError("close before sink meet eos"); + } + auto* block = _shared_state->build_block.get(); + uint64_t hash_table_size = block ? 
block->rows() : 0; + { + SCOPED_TIMER(_runtime_filter_init_timer); + RETURN_IF_ERROR(_runtime_filter_slots->init_filters(state, hash_table_size)); + RETURN_IF_ERROR(_runtime_filter_slots->ignore_filters(state)); + } + if (hash_table_size > 1) { + SCOPED_TIMER(_runtime_filter_compute_timer); + _runtime_filter_slots->insert(block); + } + } else if ((p._shared_hashtable_controller && !p._shared_hash_table_context->signaled) || + (p._shared_hash_table_context && + !p._shared_hash_table_context->complete_build_stage)) { + throw Exception(ErrorCode::INTERNAL_ERROR, "build_sink::close meet error state"); } else { - // do not publish filter coz local rf not inited and useless - return Base::close(state, exec_status); - } - } else if (_should_build_hash_table) { - if (p._shared_hashtable_controller && !p._shared_hash_table_context->complete_build_stage) { - return Status::InternalError("close before sink meet eos"); + RETURN_IF_ERROR( + _runtime_filter_slots->copy_from_shared_context(p._shared_hash_table_context)); } - auto* block = _shared_state->build_block.get(); - uint64_t hash_table_size = block ? 
block->rows() : 0; - { - SCOPED_TIMER(_runtime_filter_init_timer); - RETURN_IF_ERROR(_runtime_filter_slots->init_filters(state, hash_table_size)); - RETURN_IF_ERROR(_runtime_filter_slots->ignore_filters(state)); - } - if (hash_table_size > 1) { - SCOPED_TIMER(_runtime_filter_compute_timer); - _runtime_filter_slots->insert(block); - } - } - SCOPED_TIMER(_publish_runtime_filter_timer); - RETURN_IF_ERROR_OR_CATCH_EXCEPTION( - _runtime_filter_slots->publish(state, !_should_build_hash_table)); + SCOPED_TIMER(_publish_runtime_filter_timer); + RETURN_IF_ERROR(_runtime_filter_slots->publish(state, !_should_build_hash_table)); + } catch (Exception& e) { + return Status::InternalError( + "rf process meet error: {}, wake_up_by_downstream: {}, should_build_hash_table: " + "{}, _finish_dependency: {}, complete_build_stage: {}, shared_hash_table_signaled: " + "{}", + e.to_string(), state->get_task()->wake_up_by_downstream(), _should_build_hash_table, + _finish_dependency->debug_string(), + p._shared_hash_table_context && !p._shared_hash_table_context->complete_build_stage, + p._shared_hashtable_controller && !p._shared_hash_table_context->signaled); + } return Base::close(state, exec_status); } @@ -537,9 +556,6 @@ Status HashJoinBuildSinkOperatorX::sink(RuntimeState* state, vectorized::Block* return _shared_hash_table_context->status; } - RETURN_IF_ERROR(local_state._runtime_filter_slots->copy_from_shared_context( - _shared_hash_table_context)); - local_state.profile()->add_info_string( "SharedHashTableFrom", print_id( diff --git a/be/src/pipeline/exec/nested_loop_join_build_operator.cpp b/be/src/pipeline/exec/nested_loop_join_build_operator.cpp index 9e3e8a08ca83a5..35b9de619f393d 100644 --- a/be/src/pipeline/exec/nested_loop_join_build_operator.cpp +++ b/be/src/pipeline/exec/nested_loop_join_build_operator.cpp @@ -67,7 +67,7 @@ Status NestedLoopJoinBuildSinkLocalState::init(RuntimeState* state, LocalSinkSta _runtime_filters.resize(p._runtime_filter_descs.size()); for (size_t i 
= 0; i < p._runtime_filter_descs.size(); i++) { RETURN_IF_ERROR(state->register_producer_runtime_filter(p._runtime_filter_descs[i], - &_runtime_filters[i], false)); + &_runtime_filters[i])); } return Status::OK(); } diff --git a/be/src/pipeline/exec/partitioned_aggregation_sink_operator.cpp b/be/src/pipeline/exec/partitioned_aggregation_sink_operator.cpp index ab0a43f4a635cf..5273960a5c1c29 100644 --- a/be/src/pipeline/exec/partitioned_aggregation_sink_operator.cpp +++ b/be/src/pipeline/exec/partitioned_aggregation_sink_operator.cpp @@ -202,7 +202,7 @@ size_t PartitionedAggSinkOperatorX::revocable_mem_size(RuntimeState* state) cons Status PartitionedAggSinkLocalState::setup_in_memory_agg_op(RuntimeState* state) { _runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); _runtime_state->set_task_execution_context(state->get_task_execution_context().lock()); _runtime_state->set_be_number(state->be_number()); diff --git a/be/src/pipeline/exec/partitioned_aggregation_source_operator.cpp b/be/src/pipeline/exec/partitioned_aggregation_source_operator.cpp index 655a6e19725a9b..cdc6ef881d436d 100644 --- a/be/src/pipeline/exec/partitioned_aggregation_source_operator.cpp +++ b/be/src/pipeline/exec/partitioned_aggregation_source_operator.cpp @@ -166,7 +166,7 @@ Status PartitionedAggSourceOperatorX::get_block(RuntimeState* state, vectorized: Status PartitionedAggLocalState::setup_in_memory_agg_op(RuntimeState* state) { _runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); 
_runtime_state->set_task_execution_context(state->get_task_execution_context().lock()); _runtime_state->set_be_number(state->be_number()); diff --git a/be/src/pipeline/exec/partitioned_hash_join_probe_operator.cpp b/be/src/pipeline/exec/partitioned_hash_join_probe_operator.cpp index 0e56acc1c574b2..20b25d54ff9f16 100644 --- a/be/src/pipeline/exec/partitioned_hash_join_probe_operator.cpp +++ b/be/src/pipeline/exec/partitioned_hash_join_probe_operator.cpp @@ -606,7 +606,7 @@ Status PartitionedHashJoinProbeOperatorX::_setup_internal_operators( } local_state._runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); local_state._runtime_state->set_task_execution_context( diff --git a/be/src/pipeline/exec/partitioned_hash_join_sink_operator.cpp b/be/src/pipeline/exec/partitioned_hash_join_sink_operator.cpp index d221eaeed0faba..878c3870946f1c 100644 --- a/be/src/pipeline/exec/partitioned_hash_join_sink_operator.cpp +++ b/be/src/pipeline/exec/partitioned_hash_join_sink_operator.cpp @@ -438,7 +438,7 @@ Status PartitionedHashJoinSinkOperatorX::_setup_internal_operator(RuntimeState* auto& local_state = get_local_state(state); local_state._shared_state->inner_runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); local_state._shared_state->inner_runtime_state->set_task_execution_context( state->get_task_execution_context().lock()); diff --git a/be/src/pipeline/exec/schema_scan_operator.cpp b/be/src/pipeline/exec/schema_scan_operator.cpp index 006ecf8ad82e84..ddc2821cac14a1 100644 --- 
a/be/src/pipeline/exec/schema_scan_operator.cpp +++ b/be/src/pipeline/exec/schema_scan_operator.cpp @@ -48,7 +48,7 @@ Status SchemaScanLocalState::init(RuntimeState* state, LocalStateInfo& info) { // new one scanner _schema_scanner = SchemaScanner::create(schema_table->schema_table_type()); - _schema_scanner->set_dependency(_data_dependency, _finish_dependency); + _schema_scanner->set_dependency(_data_dependency); if (nullptr == _schema_scanner) { return Status::InternalError("schema scanner get nullptr pointer."); } @@ -266,9 +266,6 @@ Status SchemaScanOperatorX::get_block(RuntimeState* state, vectorized::Block* bl } while (block->rows() == 0 && !*eos); local_state.reached_limit(block, eos); - if (*eos) { - local_state._finish_dependency->set_always_ready(); - } return Status::OK(); } diff --git a/be/src/pipeline/exec/schema_scan_operator.h b/be/src/pipeline/exec/schema_scan_operator.h index 03cf422fbc52e6..c8ddf885e98a0f 100644 --- a/be/src/pipeline/exec/schema_scan_operator.h +++ b/be/src/pipeline/exec/schema_scan_operator.h @@ -36,9 +36,6 @@ class SchemaScanLocalState final : public PipelineXLocalState<> { SchemaScanLocalState(RuntimeState* state, OperatorXBase* parent) : PipelineXLocalState<>(state, parent) { - _finish_dependency = - std::make_shared(parent->operator_id(), parent->node_id(), - parent->get_name() + "_FINISH_DEPENDENCY", true); _data_dependency = std::make_shared(parent->operator_id(), parent->node_id(), parent->get_name() + "_DEPENDENCY", true); } @@ -48,7 +45,6 @@ class SchemaScanLocalState final : public PipelineXLocalState<> { Status open(RuntimeState* state) override; - Dependency* finishdependency() override { return _finish_dependency.get(); } std::vector dependencies() const override { return {_data_dependency.get()}; } private: @@ -57,7 +53,6 @@ class SchemaScanLocalState final : public PipelineXLocalState<> { SchemaScannerParam _scanner_param; std::unique_ptr _schema_scanner; - std::shared_ptr _finish_dependency; std::shared_ptr 
_data_dependency; }; diff --git a/be/src/pipeline/exec/spill_sort_sink_operator.cpp b/be/src/pipeline/exec/spill_sort_sink_operator.cpp index 6e6689d4134deb..6071301c1d7bcc 100644 --- a/be/src/pipeline/exec/spill_sort_sink_operator.cpp +++ b/be/src/pipeline/exec/spill_sort_sink_operator.cpp @@ -80,7 +80,7 @@ Status SpillSortSinkLocalState::close(RuntimeState* state, Status execsink_statu Status SpillSortSinkLocalState::setup_in_memory_sort_op(RuntimeState* state) { _runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); _runtime_state->set_task_execution_context(state->get_task_execution_context().lock()); _runtime_state->set_be_number(state->be_number()); diff --git a/be/src/pipeline/exec/spill_sort_source_operator.cpp b/be/src/pipeline/exec/spill_sort_source_operator.cpp index e766cb27168de1..69ed816fa9142d 100644 --- a/be/src/pipeline/exec/spill_sort_source_operator.cpp +++ b/be/src/pipeline/exec/spill_sort_source_operator.cpp @@ -212,7 +212,7 @@ Status SpillSortLocalState::_create_intermediate_merger( } Status SpillSortLocalState::setup_in_memory_sort_op(RuntimeState* state) { _runtime_state = RuntimeState::create_unique( - nullptr, state->fragment_instance_id(), state->query_id(), state->fragment_id(), + state->fragment_instance_id(), state->query_id(), state->fragment_id(), state->query_options(), TQueryGlobals {}, state->exec_env(), state->get_query_ctx()); _runtime_state->set_task_execution_context(state->get_task_execution_context().lock()); _runtime_state->set_be_number(state->be_number()); diff --git a/be/src/pipeline/local_exchange/local_exchanger.h b/be/src/pipeline/local_exchange/local_exchanger.h index f518e2649f89e6..4d699baa52fb8b 100644 --- a/be/src/pipeline/local_exchange/local_exchanger.h +++ 
b/be/src/pipeline/local_exchange/local_exchanger.h @@ -110,7 +110,11 @@ struct BlockQueue { : eos(other.eos.load()), data_queue(std::move(other.data_queue)) {} inline bool enqueue(BlockType const& item) { if (!eos) { - data_queue.enqueue(item); + if (!data_queue.enqueue(item)) [[unlikely]] { + throw Exception(ErrorCode::INTERNAL_ERROR, + "Exception occurs in data queue [size = {}] of local exchange.", + data_queue.size_approx()); + } return true; } return false; @@ -118,7 +122,11 @@ struct BlockQueue { inline bool enqueue(BlockType&& item) { if (!eos) { - data_queue.enqueue(std::move(item)); + if (!data_queue.enqueue(std::move(item))) [[unlikely]] { + throw Exception(ErrorCode::INTERNAL_ERROR, + "Exception occurs in data queue [size = {}] of local exchange.", + data_queue.size_approx()); + } return true; } return false; @@ -186,6 +194,8 @@ struct BlockWrapper { shared_state->exchanger->_free_block_limit * shared_state->exchanger->_num_sources) { data_block.clear_column_data(); + // Free blocks is used to improve memory efficiency. Failure during pushing back + // free block will not incur any bad result so just ignore the return value. 
shared_state->exchanger->_free_blocks.enqueue(std::move(data_block)); } } diff --git a/be/src/pipeline/pipeline.cpp b/be/src/pipeline/pipeline.cpp index 96da754daa5d98..e4678b7dcf3a83 100644 --- a/be/src/pipeline/pipeline.cpp +++ b/be/src/pipeline/pipeline.cpp @@ -112,7 +112,12 @@ void Pipeline::make_all_runnable() { if (_sink->count_down_destination()) { for (auto* task : _tasks) { if (task) { - task->clear_blocking_state(true); + task->set_wake_up_by_downstream(); + } + } + for (auto* task : _tasks) { + if (task) { + task->clear_blocking_state(); } } } diff --git a/be/src/pipeline/pipeline.h b/be/src/pipeline/pipeline.h index b969186b178bf7..afbe6c77596432 100644 --- a/be/src/pipeline/pipeline.h +++ b/be/src/pipeline/pipeline.h @@ -73,6 +73,14 @@ class Pipeline : public std::enable_shared_from_this { return idx == ExchangeType::HASH_SHUFFLE || idx == ExchangeType::BUCKET_HASH_SHUFFLE; } + // For HASH_SHUFFLE, BUCKET_HASH_SHUFFLE, and ADAPTIVE_PASSTHROUGH, + // data is processed and shuffled on the sink. + // Compared to PASSTHROUGH, this is a relatively heavy operation. 
+ static bool heavy_operations_on_the_sink(ExchangeType idx) { + return idx == ExchangeType::HASH_SHUFFLE || idx == ExchangeType::BUCKET_HASH_SHUFFLE || + idx == ExchangeType::ADAPTIVE_PASSTHROUGH; + } + bool need_to_local_exchange(const DataDistribution target_data_distribution, const int idx) const; void init_data_distribution() { diff --git a/be/src/pipeline/pipeline_fragment_context.cpp b/be/src/pipeline/pipeline_fragment_context.cpp index 0775ef3fb19826..8ceb63eb99324c 100644 --- a/be/src/pipeline/pipeline_fragment_context.cpp +++ b/be/src/pipeline/pipeline_fragment_context.cpp @@ -397,9 +397,9 @@ Status PipelineFragmentContext::_build_pipeline_tasks(const doris::TPipelineFrag << print_id(_task_runtime_states[pip_idx][i]->fragment_instance_id()) << " " << pipeline->debug_string(); _task_runtime_states[pip_idx][i] = RuntimeState::create_unique( - this, local_params.fragment_instance_id, request.query_id, - request.fragment_id, request.query_options, _query_ctx->query_globals, - _exec_env, _query_ctx.get()); + local_params.fragment_instance_id, request.query_id, request.fragment_id, + request.query_options, _query_ctx->query_globals, _exec_env, + _query_ctx.get()); auto& task_runtime_state = _task_runtime_states[pip_idx][i]; _runtime_filter_states[i]->set_state(task_runtime_state.get()); { @@ -814,7 +814,7 @@ Status PipelineFragmentContext::_add_local_exchange_impl( } case ExchangeType::ADAPTIVE_PASSTHROUGH: shared_state->exchanger = AdaptivePassthroughExchanger::create_unique( - cur_pipe->num_tasks(), _num_instances, + std::max(cur_pipe->num_tasks(), _num_instances), _num_instances, _runtime_state->query_options().__isset.local_exchange_free_blocks_limit ? 
cast_set( _runtime_state->query_options().local_exchange_free_blocks_limit) @@ -915,9 +915,13 @@ Status PipelineFragmentContext::_add_local_exchange( << " cur_pipe->operators().size(): " << cur_pipe->operators().size() << " new_pip->operators().size(): " << new_pip->operators().size(); - // Add passthrough local exchanger if necessary + // There are some local shuffles with relatively heavy operations on the sink. + // If the local sink concurrency is 1 and the local source concurrency is n, the sink becomes a bottleneck. + // Therefore, local passthrough is used to increase the concurrency of the sink. + // op -> local sink(1) -> local source (n) + // op -> local passthrough(1) -> local passthrough(n) -> local sink(n) -> local source (n) if (cur_pipe->num_tasks() > 1 && new_pip->num_tasks() == 1 && - Pipeline::is_hash_exchange(data_distribution.distribution_type)) { + Pipeline::heavy_operations_on_the_sink(data_distribution.distribution_type)) { RETURN_IF_ERROR(_add_local_exchange_impl( cast_set(new_pip->operators().size()), pool, new_pip, add_pipeline(new_pip, pip_idx + 2), DataDistribution(ExchangeType::PASSTHROUGH), diff --git a/be/src/pipeline/pipeline_task.h b/be/src/pipeline/pipeline_task.h index 3b4627f589dc54..4bb062122c0c08 100644 --- a/be/src/pipeline/pipeline_task.h +++ b/be/src/pipeline/pipeline_task.h @@ -135,11 +135,12 @@ class PipelineTask { int task_id() const { return _index; }; bool is_finalized() const { return _finalized; } - void clear_blocking_state(bool wake_up_by_downstream = false) { + void set_wake_up_by_downstream() { _wake_up_by_downstream = true; } + + void clear_blocking_state() { _state->get_query_ctx()->get_execution_dependency()->set_always_ready(); // We use a lock to assure all dependencies are not deconstructed here. 
std::unique_lock lc(_dependency_lock); - _wake_up_by_downstream = _wake_up_by_downstream || wake_up_by_downstream; if (!_finalized) { _execution_dep->set_always_ready(); for (auto* dep : _filter_dependencies) { diff --git a/be/src/runtime/buffer_control_block.cpp b/be/src/runtime/buffer_control_block.cpp index 1ed2836f8eb616..8c1ae79955f317 100644 --- a/be/src/runtime/buffer_control_block.cpp +++ b/be/src/runtime/buffer_control_block.cpp @@ -292,6 +292,9 @@ Status BufferControlBlock::get_arrow_batch(std::shared_ptr* r _arrow_data_arrival.wait_for(l, std::chrono::milliseconds(20)); } + if (!_status.ok()) { + return _status; + } if (_is_cancelled) { return Status::Cancelled(fmt::format("Cancelled ()", print_id(_fragment_id))); } @@ -311,9 +314,12 @@ Status BufferControlBlock::get_arrow_batch(std::shared_ptr* r // normal path end if (_is_close) { + if (!_status.ok()) { + return _status; + } std::stringstream ss; _profile.pretty_print(&ss); - VLOG_NOTICE << fmt::format( + LOG(INFO) << fmt::format( "BufferControlBlock finished, fragment_id={}, is_close={}, is_cancelled={}, " "packet_num={}, peak_memory_usage={}, profile={}", print_id(_fragment_id), _is_close, _is_cancelled, _packet_num, @@ -321,7 +327,7 @@ Status BufferControlBlock::get_arrow_batch(std::shared_ptr* r return Status::OK(); } return Status::InternalError( - fmt::format("Get Arrow Batch Abnormal Ending ()", print_id(_fragment_id))); + fmt::format("Get Arrow Batch Abnormal Ending (), ()", print_id(_fragment_id), _status)); } void BufferControlBlock::get_arrow_batch(GetArrowResultBatchCtx* ctx) { @@ -354,10 +360,14 @@ void BufferControlBlock::get_arrow_batch(GetArrowResultBatchCtx* ctx) { // normal path end if (_is_close) { + if (!_status.ok()) { + ctx->on_failure(_status); + return; + } ctx->on_close(_packet_num); std::stringstream ss; _profile.pretty_print(&ss); - VLOG_NOTICE << fmt::format( + LOG(INFO) << fmt::format( "BufferControlBlock finished, fragment_id={}, is_close={}, is_cancelled={}, " 
"packet_num={}, peak_memory_usage={}, profile={}", print_id(_fragment_id), _is_close, _is_cancelled, _packet_num, @@ -391,8 +401,8 @@ Status BufferControlBlock::find_arrow_schema(std::shared_ptr* arr if (_is_close) { return Status::RuntimeError(fmt::format("Closed ()", print_id(_fragment_id))); } - return Status::InternalError( - fmt::format("Get Arrow Schema Abnormal Ending ()", print_id(_fragment_id))); + return Status::InternalError(fmt::format("Get Arrow Schema Abnormal Ending (), ()", + print_id(_fragment_id), _status)); } Status BufferControlBlock::close(const TUniqueId& id, Status exec_status) { diff --git a/be/src/runtime/exec_env.h b/be/src/runtime/exec_env.h index a27936f5f0d88b..636ce2bf288b58 100644 --- a/be/src/runtime/exec_env.h +++ b/be/src/runtime/exec_env.h @@ -178,7 +178,6 @@ class ExecEnv { std::vector mem_tracker_limiter_pool; void init_mem_tracker(); std::shared_ptr orphan_mem_tracker() { return _orphan_mem_tracker; } - std::shared_ptr page_no_cache_mem_tracker() { return _page_no_cache_mem_tracker; } std::shared_ptr brpc_iobuf_block_memory_tracker() { return _brpc_iobuf_block_memory_tracker; } @@ -188,6 +187,15 @@ class ExecEnv { std::shared_ptr stream_load_pipe_tracker() { return _stream_load_pipe_tracker; } + std::shared_ptr tablets_no_cache_mem_tracker() { + return _tablets_no_cache_mem_tracker; + } + std::shared_ptr rowsets_no_cache_mem_tracker() { + return _rowsets_no_cache_mem_tracker; + } + std::shared_ptr segments_no_cache_mem_tracker() { + return _segments_no_cache_mem_tracker; + } std::shared_ptr point_query_executor_mem_tracker() { return _point_query_executor_mem_tracker; } @@ -377,13 +385,15 @@ class ExecEnv { // Ideally, all threads are expected to attach to the specified tracker, so that "all memory has its own ownership", // and the consumption of the orphan mem tracker is close to 0, but greater than 0. std::shared_ptr _orphan_mem_tracker; - // page size not in cache, data page/index page/etc. 
- std::shared_ptr _page_no_cache_mem_tracker; std::shared_ptr _brpc_iobuf_block_memory_tracker; // Count the memory consumption of segment compaction tasks. std::shared_ptr _segcompaction_mem_tracker; std::shared_ptr _stream_load_pipe_tracker; + std::shared_ptr _tablets_no_cache_mem_tracker; + std::shared_ptr _rowsets_no_cache_mem_tracker; + std::shared_ptr _segments_no_cache_mem_tracker; + // Tracking memory may be shared between multiple queries. std::shared_ptr _point_query_executor_mem_tracker; std::shared_ptr _block_compression_mem_tracker; diff --git a/be/src/runtime/exec_env_init.cpp b/be/src/runtime/exec_env_init.cpp index b7f926cc3b4512..a371cdb947ff56 100644 --- a/be/src/runtime/exec_env_init.cpp +++ b/be/src/runtime/exec_env_init.cpp @@ -599,15 +599,20 @@ void ExecEnv::init_mem_tracker() { _s_tracking_memory = true; _orphan_mem_tracker = MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "Orphan"); - _page_no_cache_mem_tracker = std::make_shared("PageNoCache"); _brpc_iobuf_block_memory_tracker = MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "IOBufBlockMemory"); _segcompaction_mem_tracker = - MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "SegCompaction"); + MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::COMPACTION, "SegCompaction"); + _tablets_no_cache_mem_tracker = MemTrackerLimiter::create_shared( + MemTrackerLimiter::Type::METADATA, "Tablets(not in SchemaCache, TabletSchemaCache)"); + _segments_no_cache_mem_tracker = MemTrackerLimiter::create_shared( + MemTrackerLimiter::Type::METADATA, "Segments(not in SegmentCache)"); + _rowsets_no_cache_mem_tracker = + MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::METADATA, "Rowsets"); _point_query_executor_mem_tracker = MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "PointQueryExecutor"); _query_cache_mem_tracker = - MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "QueryCache"); + 
MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::CACHE, "QueryCache"); _block_compression_mem_tracker = MemTrackerLimiter::create_shared(MemTrackerLimiter::Type::GLOBAL, "BlockCompression"); _rowid_storage_reader_tracker = @@ -716,7 +721,7 @@ void ExecEnv::destroy() { _file_cache_open_fd_cache.reset(); SAFE_STOP(_write_cooldown_meta_executors); - // StorageEngine must be destoried before _page_no_cache_mem_tracker.reset and _cache_manager destory + // StorageEngine must be destoried before _cache_manager destory SAFE_STOP(_storage_engine); _storage_engine.reset(); diff --git a/be/src/runtime/fragment_mgr.cpp b/be/src/runtime/fragment_mgr.cpp index 1e72fa756d3dd3..f96e4152500808 100644 --- a/be/src/runtime/fragment_mgr.cpp +++ b/be/src/runtime/fragment_mgr.cpp @@ -269,8 +269,11 @@ void FragmentMgr::stop() { // Only me can delete { - std::lock_guard lock(_lock); + std::unique_lock lock(_query_ctx_map_mutex); _query_ctx_map.clear(); + } + { + std::unique_lock lock(_pipeline_map_mutex); _pipeline_map.clear(); } _thread_pool->shutdown(); @@ -583,11 +586,7 @@ Status FragmentMgr::start_query_execution(const PExecPlanFragmentStartRequest* r TUniqueId query_id; query_id.__set_hi(request->query_id().hi()); query_id.__set_lo(request->query_id().lo()); - std::shared_ptr q_ctx = nullptr; - { - std::lock_guard lock(_lock); - q_ctx = _get_or_erase_query_ctx(query_id); - } + auto q_ctx = get_query_ctx(query_id); if (q_ctx) { q_ctx->set_ready_to_execute(Status::OK()); LOG_INFO("Query {} start execution", print_id(query_id)); @@ -602,114 +601,107 @@ Status FragmentMgr::start_query_execution(const PExecPlanFragmentStartRequest* r void FragmentMgr::remove_pipeline_context( std::shared_ptr f_context) { - { - std::lock_guard lock(_lock); - auto query_id = f_context->get_query_id(); - int64 now = duration_cast( - std::chrono::system_clock::now().time_since_epoch()) - .count(); - g_fragment_executing_count << -1; - g_fragment_last_active_time.set_value(now); - 
_pipeline_map.erase({query_id, f_context->get_fragment_id()}); - } + auto query_id = f_context->get_query_id(); + int64 now = duration_cast( + std::chrono::system_clock::now().time_since_epoch()) + .count(); + g_fragment_executing_count << -1; + g_fragment_last_active_time.set_value(now); + + std::unique_lock lock(_pipeline_map_mutex); + _pipeline_map.erase({query_id, f_context->get_fragment_id()}); } -std::shared_ptr FragmentMgr::_get_or_erase_query_ctx(const TUniqueId& query_id) { +std::shared_ptr FragmentMgr::get_query_ctx(const TUniqueId& query_id) { + std::shared_lock lock(_query_ctx_map_mutex); auto search = _query_ctx_map.find(query_id); if (search != _query_ctx_map.end()) { if (auto q_ctx = search->second.lock()) { return q_ctx; - } else { - LOG(WARNING) << "Query context (query id = " << print_id(query_id) - << ") has been released."; - _query_ctx_map.erase(search); - return nullptr; } } return nullptr; } -std::shared_ptr FragmentMgr::get_or_erase_query_ctx_with_lock( - const TUniqueId& query_id) { - std::unique_lock lock(_lock); - return _get_or_erase_query_ctx(query_id); -} - -template -Status FragmentMgr::_get_query_ctx(const Params& params, TUniqueId query_id, bool pipeline, - QuerySource query_source, - std::shared_ptr& query_ctx) { +Status FragmentMgr::_get_or_create_query_ctx(const TPipelineFragmentParams& params, + TUniqueId query_id, bool pipeline, + QuerySource query_source, + std::shared_ptr& query_ctx) { DBUG_EXECUTE_IF("FragmentMgr._get_query_ctx.failed", { return Status::InternalError("FragmentMgr._get_query_ctx.failed, query id {}", print_id(query_id)); }); + + // Find _query_ctx_map, in case some other request has already + // create the query fragments context. 
+ query_ctx = get_query_ctx(query_id); if (params.is_simplified_param) { // Get common components from _query_ctx_map - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { - query_ctx = q_ctx; - } else { + if (!query_ctx) { return Status::InternalError( "Failed to get query fragments context. Query {} may be timeout or be " "cancelled. host: {}", print_id(query_id), BackendOptions::get_localhost()); } } else { - // Find _query_ctx_map, in case some other request has already - // create the query fragments context. - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { - query_ctx = q_ctx; - return Status::OK(); - } + if (!query_ctx) { + std::unique_lock lock(_query_ctx_map_mutex); + // Only one thread need create query ctx. other thread just get query_ctx in _query_ctx_map. + auto search = _query_ctx_map.find(query_id); + if (search != _query_ctx_map.end()) { + query_ctx = search->second.lock(); + } - // First time a fragment of a query arrived. print logs. - LOG(INFO) << "query_id: " << print_id(query_id) << ", coord_addr: " << params.coord - << ", total fragment num on current host: " << params.fragment_num_on_host - << ", fe process uuid: " << params.query_options.fe_process_uuid - << ", query type: " << params.query_options.query_type - << ", report audit fe:" << params.current_connect_fe; - - // This may be a first fragment request of the query. - // Create the query fragments context. 
- query_ctx = QueryContext::create_shared(query_id, _exec_env, params.query_options, - params.coord, params.is_nereids, - params.current_connect_fe, query_source); - SCOPED_SWITCH_THREAD_MEM_TRACKER_LIMITER(query_ctx->query_mem_tracker); - RETURN_IF_ERROR(DescriptorTbl::create(&(query_ctx->obj_pool), params.desc_tbl, - &(query_ctx->desc_tbl))); - // set file scan range params - if (params.__isset.file_scan_params) { - query_ctx->file_scan_range_params_map = params.file_scan_params; - } + if (!query_ctx) { + // First time a fragment of a query arrived. print logs. + LOG(INFO) << "query_id: " << print_id(query_id) << ", coord_addr: " << params.coord + << ", total fragment num on current host: " << params.fragment_num_on_host + << ", fe process uuid: " << params.query_options.fe_process_uuid + << ", query type: " << params.query_options.query_type + << ", report audit fe:" << params.current_connect_fe; + + // This may be a first fragment request of the query. + // Create the query fragments context. 
+ query_ctx = QueryContext::create_shared(query_id, _exec_env, params.query_options, + params.coord, params.is_nereids, + params.current_connect_fe, query_source); + SCOPED_SWITCH_THREAD_MEM_TRACKER_LIMITER(query_ctx->query_mem_tracker); + RETURN_IF_ERROR(DescriptorTbl::create(&(query_ctx->obj_pool), params.desc_tbl, + &(query_ctx->desc_tbl))); + // set file scan range params + if (params.__isset.file_scan_params) { + query_ctx->file_scan_range_params_map = params.file_scan_params; + } - query_ctx->query_globals = params.query_globals; + query_ctx->query_globals = params.query_globals; - if (params.__isset.resource_info) { - query_ctx->user = params.resource_info.user; - query_ctx->group = params.resource_info.group; - query_ctx->set_rsc_info = true; - } + if (params.__isset.resource_info) { + query_ctx->user = params.resource_info.user; + query_ctx->group = params.resource_info.group; + query_ctx->set_rsc_info = true; + } - _set_scan_concurrency(params, query_ctx.get()); - - if (params.__isset.workload_groups && !params.workload_groups.empty()) { - uint64_t tg_id = params.workload_groups[0].id; - WorkloadGroupPtr workload_group_ptr = - _exec_env->workload_group_mgr()->get_task_group_by_id(tg_id); - if (workload_group_ptr != nullptr) { - RETURN_IF_ERROR(workload_group_ptr->add_query(query_id, query_ctx)); - RETURN_IF_ERROR(query_ctx->set_workload_group(workload_group_ptr)); - _exec_env->runtime_query_statistics_mgr()->set_workload_group_id(print_id(query_id), - tg_id); - } else { - LOG(WARNING) << "Query/load id: " << print_id(query_ctx->query_id()) - << "can't find its workload group " << tg_id; + _set_scan_concurrency(params, query_ctx.get()); + + if (params.__isset.workload_groups && !params.workload_groups.empty()) { + uint64_t tg_id = params.workload_groups[0].id; + WorkloadGroupPtr workload_group_ptr = + _exec_env->workload_group_mgr()->get_task_group_by_id(tg_id); + if (workload_group_ptr != nullptr) { + 
RETURN_IF_ERROR(workload_group_ptr->add_query(query_id, query_ctx)); + RETURN_IF_ERROR(query_ctx->set_workload_group(workload_group_ptr)); + _exec_env->runtime_query_statistics_mgr()->set_workload_group_id( + print_id(query_id), tg_id); + } else { + LOG(WARNING) << "Query/load id: " << print_id(query_ctx->query_id()) + << "can't find its workload group " << tg_id; + } + } + // There is some logic in query ctx's dctor, we could not check if exists and delete the + // temp query ctx now. For example, the query id maybe removed from workload group's queryset. + _query_ctx_map.insert({query_id, query_ctx}); } } - // There is some logic in query ctx's dctor, we could not check if exists and delete the - // temp query ctx now. For example, the query id maybe removed from workload group's queryset. - _query_ctx_map.insert(std::make_pair(query_ctx->query_id(), query_ctx)); } return Status::OK(); } @@ -723,13 +715,13 @@ std::string FragmentMgr::dump_pipeline_tasks(int64_t duration) { fmt::memory_buffer debug_string_buffer; size_t i = 0; { - std::lock_guard lock(_lock); fmt::format_to(debug_string_buffer, "{} pipeline fragment contexts are still running! 
duration_limit={}\n", _pipeline_map.size(), duration); - timespec now; clock_gettime(CLOCK_MONOTONIC, &now); + + std::shared_lock lock(_pipeline_map_mutex); for (auto& it : _pipeline_map) { auto elapsed = it.second->elapsed_time() / 1000000000.0; if (elapsed < duration) { @@ -748,7 +740,7 @@ std::string FragmentMgr::dump_pipeline_tasks(int64_t duration) { } std::string FragmentMgr::dump_pipeline_tasks(TUniqueId& query_id) { - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { + if (auto q_ctx = get_query_ctx(query_id)) { return q_ctx->print_all_pipeline_context(); } else { return fmt::format( @@ -767,7 +759,8 @@ Status FragmentMgr::exec_plan_fragment(const TPipelineFragmentParams& params, << apache::thrift::ThriftDebugString(params.query_options).c_str(); std::shared_ptr query_ctx; - RETURN_IF_ERROR(_get_query_ctx(params, params.query_id, true, query_source, query_ctx)); + RETURN_IF_ERROR( + _get_or_create_query_ctx(params, params.query_id, true, query_source, query_ctx)); SCOPED_ATTACH_TASK(query_ctx.get()); int64_t duration_ns = 0; std::shared_ptr context = @@ -800,16 +793,8 @@ Status FragmentMgr::exec_plan_fragment(const TPipelineFragmentParams& params, } { - // (query_id, fragment_id) is executed only on one BE, locks _pipeline_map. 
- std::lock_guard lock(_lock); for (const auto& local_param : params.local_params) { const TUniqueId& fragment_instance_id = local_param.fragment_instance_id; - auto iter = _pipeline_map.find({params.query_id, params.fragment_id}); - if (iter != _pipeline_map.end()) { - return Status::InternalError( - "exec_plan_fragment query_id({}) input duplicated fragment_id({})", - print_id(params.query_id), params.fragment_id); - } query_ctx->fragment_instance_ids.push_back(fragment_instance_id); } @@ -818,7 +803,15 @@ Status FragmentMgr::exec_plan_fragment(const TPipelineFragmentParams& params, .count(); g_fragment_executing_count << 1; g_fragment_last_active_time.set_value(now); - // TODO: simplify this mapping + + // (query_id, fragment_id) is executed only on one BE, locks _pipeline_map. + std::unique_lock lock(_pipeline_map_mutex); + auto iter = _pipeline_map.find({params.query_id, params.fragment_id}); + if (iter != _pipeline_map.end()) { + return Status::InternalError( + "exec_plan_fragment query_id({}) input duplicated fragment_id({})", + print_id(params.query_id), params.fragment_id); + } _pipeline_map.insert({{params.query_id, params.fragment_id}, context}); } @@ -848,8 +841,7 @@ void FragmentMgr::cancel_query(const TUniqueId query_id, const Status reason) { std::shared_ptr query_ctx = nullptr; std::vector all_instance_ids; { - std::lock_guard state_lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { + if (auto q_ctx = get_query_ctx(query_id)) { query_ctx = q_ctx; // Copy instanceids to avoid concurrent modification. // And to reduce the scope of lock. 
@@ -862,7 +854,7 @@ void FragmentMgr::cancel_query(const TUniqueId query_id, const Status reason) { } query_ctx->cancel(reason); { - std::lock_guard state_lock(_lock); + std::unique_lock l(_query_ctx_map_mutex); _query_ctx_map.erase(query_id); } LOG(INFO) << "Query " << print_id(query_id) @@ -898,7 +890,7 @@ void FragmentMgr::cancel_worker() { std::vector> ctx; { - std::lock_guard lock(_lock); + std::shared_lock lock(_pipeline_map_mutex); ctx.reserve(_pipeline_map.size()); for (auto& pipeline_itr : _pipeline_map) { ctx.push_back(pipeline_itr.second); @@ -910,29 +902,34 @@ void FragmentMgr::cancel_worker() { std::unordered_map, BrpcItem> brpc_stub_with_queries; { - std::lock_guard lock(_lock); - for (auto it = _query_ctx_map.begin(); it != _query_ctx_map.end();) { - if (auto q_ctx = it->second.lock()) { - if (q_ctx->is_timeout(now)) { - LOG_WARNING("Query {} is timeout", print_id(it->first)); - queries_timeout.push_back(it->first); - } else if (config::enable_brpc_connection_check) { - auto brpc_stubs = q_ctx->get_using_brpc_stubs(); - for (auto& item : brpc_stubs) { - if (!brpc_stub_with_queries.contains(item.second)) { - brpc_stub_with_queries.emplace(item.second, - BrpcItem {item.first, {q_ctx}}); - } else { - brpc_stub_with_queries[item.second].queries.emplace_back(q_ctx); + { + // TODO: Now only the cancel worker do the GC the _query_ctx_map. each query must + // do erase the finish query unless in _query_ctx_map. 
Rethink the logic is ok + std::unique_lock lock(_query_ctx_map_mutex); + for (auto it = _query_ctx_map.begin(); it != _query_ctx_map.end();) { + if (auto q_ctx = it->second.lock()) { + if (q_ctx->is_timeout(now)) { + LOG_WARNING("Query {} is timeout", print_id(it->first)); + queries_timeout.push_back(it->first); + } else if (config::enable_brpc_connection_check) { + auto brpc_stubs = q_ctx->get_using_brpc_stubs(); + for (auto& item : brpc_stubs) { + if (!brpc_stub_with_queries.contains(item.second)) { + brpc_stub_with_queries.emplace(item.second, + BrpcItem {item.first, {q_ctx}}); + } else { + brpc_stub_with_queries[item.second].queries.emplace_back(q_ctx); + } } } + ++it; + } else { + it = _query_ctx_map.erase(it); } - ++it; - } else { - it = _query_ctx_map.erase(it); } } + std::shared_lock lock(_query_ctx_map_mutex); // We use a very conservative cancel strategy. // 0. If there are no running frontends, do not cancel any queries. // 1. If query's process uuid is zero, do not cancel @@ -1215,7 +1212,7 @@ Status FragmentMgr::apply_filterv2(const PPublishFilterRequestV2* request, const auto& fragment_ids = request->fragment_ids(); { - std::unique_lock lock(_lock); + std::shared_lock lock(_pipeline_map_mutex); for (auto fragment_id : fragment_ids) { auto iter = _pipeline_map.find({UniqueId(request->query_id()).to_thrift(), fragment_id}); @@ -1267,8 +1264,7 @@ Status FragmentMgr::send_filter_size(const PSendFilterSizeRequest* request) { TUniqueId query_id; query_id.__set_hi(queryid.hi); query_id.__set_lo(queryid.lo); - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { + if (auto q_ctx = get_query_ctx(query_id)) { query_ctx = q_ctx; } else { return Status::EndOfFile( @@ -1291,8 +1287,7 @@ Status FragmentMgr::sync_filter_size(const PSyncFilterSizeRequest* request) { TUniqueId query_id; query_id.__set_hi(queryid.hi); query_id.__set_lo(queryid.lo); - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { + 
if (auto q_ctx = get_query_ctx(query_id)) { query_ctx = q_ctx; } else { return Status::EndOfFile( @@ -1312,8 +1307,7 @@ Status FragmentMgr::merge_filter(const PMergeFilterRequest* request, TUniqueId query_id; query_id.__set_hi(queryid.hi); query_id.__set_lo(queryid.lo); - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { + if (auto q_ctx = get_query_ctx(query_id)) { query_ctx = q_ctx; } else { return Status::EndOfFile( @@ -1330,7 +1324,7 @@ Status FragmentMgr::merge_filter(const PMergeFilterRequest* request, void FragmentMgr::get_runtime_query_info(std::vector* query_info_list) { { - std::lock_guard lock(_lock); + std::unique_lock lock(_query_ctx_map_mutex); for (auto iter = _query_ctx_map.begin(); iter != _query_ctx_map.end();) { if (auto q_ctx = iter->second.lock()) { WorkloadQueryInfo workload_query_info; @@ -1353,19 +1347,9 @@ Status FragmentMgr::get_realtime_exec_status(const TUniqueId& query_id, return Status::InvalidArgument("exes_status is nullptr"); } - std::shared_ptr query_context = nullptr; - - { - std::lock_guard lock(_lock); - if (auto q_ctx = _get_or_erase_query_ctx(query_id)) { - query_context = q_ctx; - } else { - return Status::NotFound("Query {} has been released", print_id(query_id)); - } - } - + std::shared_ptr query_context = get_query_ctx(query_id); if (query_context == nullptr) { - return Status::NotFound("Query {} not found", print_id(query_id)); + return Status::NotFound("Query {} not found or released", print_id(query_id)); } *exec_status = query_context->get_realtime_exec_status(); diff --git a/be/src/runtime/fragment_mgr.h b/be/src/runtime/fragment_mgr.h index 0eac0469683961..63d666788d0a5f 100644 --- a/be/src/runtime/fragment_mgr.h +++ b/be/src/runtime/fragment_mgr.h @@ -133,7 +133,7 @@ class FragmentMgr : public RestMonitorIface { ThreadPool* get_thread_pool() { return _thread_pool.get(); } int32_t running_query_num() { - std::unique_lock ctx_lock(_lock); + std::shared_lock 
lock(_query_ctx_map_mutex); return _query_ctx_map.size(); } @@ -145,7 +145,7 @@ class FragmentMgr : public RestMonitorIface { Status get_realtime_exec_status(const TUniqueId& query_id, TReportExecStatusParams* exec_status); - std::shared_ptr get_or_erase_query_ctx_with_lock(const TUniqueId& query_id); + std::shared_ptr get_query_ctx(const TUniqueId& query_id); private: struct BrpcItem { @@ -153,14 +153,12 @@ class FragmentMgr : public RestMonitorIface { std::vector> queries; }; - std::shared_ptr _get_or_erase_query_ctx(const TUniqueId& query_id); - template void _set_scan_concurrency(const Param& params, QueryContext* query_ctx); - template - Status _get_query_ctx(const Params& params, TUniqueId query_id, bool pipeline, - QuerySource query_type, std::shared_ptr& query_ctx); + Status _get_or_create_query_ctx(const TPipelineFragmentParams& params, TUniqueId query_id, + bool pipeline, QuerySource query_type, + std::shared_ptr& query_ctx); void _check_brpc_available(const std::shared_ptr& brpc_stub, const BrpcItem& brpc_item); @@ -168,20 +166,21 @@ class FragmentMgr : public RestMonitorIface { // This is input params ExecEnv* _exec_env = nullptr; + // The lock protect the `_pipeline_map` + std::shared_mutex _pipeline_map_mutex; + // (QueryID, FragmentID) -> PipelineFragmentContext + phmap::flat_hash_map, + std::shared_ptr> + _pipeline_map; + // The lock should only be used to protect the structures in fragment manager. Has to be // used in a very small scope because it may dead lock. For example, if the _lock is used // in prepare stage, the call path is prepare --> expr prepare --> may call allocator // when allocate failed, allocator may call query_is_cancelled, query is callced will also // call _lock, so that there is dead lock. 
- std::mutex _lock; - - // (QueryID, FragmentID) -> PipelineFragmentContext - std::unordered_map, - std::shared_ptr> - _pipeline_map; - + std::shared_mutex _query_ctx_map_mutex; // query id -> QueryContext - std::unordered_map> _query_ctx_map; + phmap::flat_hash_map> _query_ctx_map; std::unordered_map> _bf_size_map; CountDownLatch _stop_background_threads_latch; diff --git a/be/src/runtime/load_channel.cpp b/be/src/runtime/load_channel.cpp index 0cb313747b0373..dd426f1ab81d3e 100644 --- a/be/src/runtime/load_channel.cpp +++ b/be/src/runtime/load_channel.cpp @@ -45,8 +45,7 @@ LoadChannel::LoadChannel(const UniqueId& load_id, int64_t timeout_s, bool is_hig _backend_id(backend_id), _enable_profile(enable_profile) { std::shared_ptr query_context = - ExecEnv::GetInstance()->fragment_mgr()->get_or_erase_query_ctx_with_lock( - _load_id.to_thrift()); + ExecEnv::GetInstance()->fragment_mgr()->get_query_ctx(_load_id.to_thrift()); std::shared_ptr mem_tracker = nullptr; WorkloadGroupPtr wg_ptr = nullptr; diff --git a/be/src/runtime/load_stream.cpp b/be/src/runtime/load_stream.cpp index 752e2ff95b2917..60da45fa685fbf 100644 --- a/be/src/runtime/load_stream.cpp +++ b/be/src/runtime/load_stream.cpp @@ -428,7 +428,7 @@ LoadStream::LoadStream(PUniqueId load_id, LoadStreamMgr* load_stream_mgr, bool e TUniqueId load_tid = ((UniqueId)load_id).to_thrift(); #ifndef BE_TEST std::shared_ptr query_context = - ExecEnv::GetInstance()->fragment_mgr()->get_or_erase_query_ctx_with_lock(load_tid); + ExecEnv::GetInstance()->fragment_mgr()->get_query_ctx(load_tid); if (query_context != nullptr) { _query_thread_context = {load_tid, query_context->query_mem_tracker, query_context->workload_group()}; diff --git a/be/src/runtime/memory/cache_policy.h b/be/src/runtime/memory/cache_policy.h index e7e1c73e7cbb41..8f077a4eb45bb1 100644 --- a/be/src/runtime/memory/cache_policy.h +++ b/be/src/runtime/memory/cache_policy.h @@ -17,6 +17,8 @@ #pragma once +#include + #include "util/runtime_profile.h" namespace 
doris { @@ -123,6 +125,7 @@ class CachePolicy { {"CloudTabletCache", CacheType::CLOUD_TABLET_CACHE}, {"CloudTxnDeleteBitmapCache", CacheType::CLOUD_TXN_DELETE_BITMAP_CACHE}, {"ForUTCacheNumber", CacheType::FOR_UT_CACHE_NUMBER}, + {"QueryCache", CacheType::QUERY_CACHE}, {"TabletColumnObjectPool", CacheType::TABLET_COLUMN_OBJECT_POOL}}; static CacheType string_to_type(std::string type) { @@ -133,6 +136,9 @@ class CachePolicy { } } + inline static std::vector MetadataCache { + CacheType::SEGMENT_CACHE, CacheType::SCHEMA_CACHE, CacheType::TABLET_SCHEMA_CACHE}; + CachePolicy(CacheType type, size_t capacity, uint32_t stale_sweep_time_s, bool enable_prune); virtual ~CachePolicy(); diff --git a/be/src/runtime/memory/lru_cache_policy.h b/be/src/runtime/memory/lru_cache_policy.h index ea34e2837f1313..3fdb43facd7715 100644 --- a/be/src/runtime/memory/lru_cache_policy.h +++ b/be/src/runtime/memory/lru_cache_policy.h @@ -104,20 +104,26 @@ class LRUCachePolicy : public CachePolicy { return _mem_tracker->consumption(); } + int64_t value_mem_consumption() { + DCHECK(_value_mem_tracker != nullptr); + return _value_mem_tracker->consumption(); + } + // Insert will consume tracking_bytes to _mem_tracker and cache value destroy will release tracking_bytes. - // If LRUCacheType::SIZE, tracking_bytes usually equal to charge. - // If LRUCacheType::NUMBER, tracking_bytes usually not equal to charge, at this time charge is an weight. - // If LRUCacheType::SIZE and tracking_bytes equals 0, memory must be tracked in Doris Allocator, + // If LRUCacheType::SIZE, value_tracking_bytes usually equal to charge. + // If LRUCacheType::NUMBER, value_tracking_bytes usually not equal to charge, at this time charge is an weight. + // If LRUCacheType::SIZE and value_tracking_bytes equals 0, memory must be tracked in Doris Allocator, // cache value is allocated using Alloctor. 
- // If LRUCacheType::NUMBER and tracking_bytes equals 0, usually currently cannot accurately tracking memory size, + // If LRUCacheType::NUMBER and value_tracking_bytes equals 0, usually currently cannot accurately tracking memory size, // only tracking handle_size(106). - Cache::Handle* insert(const CacheKey& key, void* value, size_t charge, size_t tracking_bytes, + Cache::Handle* insert(const CacheKey& key, void* value, size_t charge, + size_t value_tracking_bytes, CachePriority priority = CachePriority::NORMAL) { - size_t tracking_bytes_with_handle = sizeof(LRUHandle) - 1 + key.size() + tracking_bytes; + size_t tracking_bytes = sizeof(LRUHandle) - 1 + key.size() + value_tracking_bytes; if (value != nullptr) { - mem_tracker()->consume(tracking_bytes_with_handle); ((LRUCacheValueBase*)value) - ->set_tracking_bytes(tracking_bytes_with_handle, _mem_tracker); + ->set_tracking_bytes(tracking_bytes, _mem_tracker, value_tracking_bytes, + _value_mem_tracker); } return _cache->insert(key, value, charge, priority); } @@ -265,9 +271,18 @@ class LRUCachePolicy : public CachePolicy { protected: void _init_mem_tracker(const std::string& type_name) { - _mem_tracker = MemTrackerLimiter::create_shared( - MemTrackerLimiter::Type::GLOBAL, - fmt::format("{}[{}]", type_string(_type), type_name)); + if (std::find(CachePolicy::MetadataCache.begin(), CachePolicy::MetadataCache.end(), + _type) == CachePolicy::MetadataCache.end()) { + _mem_tracker = MemTrackerLimiter::create_shared( + MemTrackerLimiter::Type::CACHE, + fmt::format("{}[{}]", type_string(_type), type_name)); + } else { + _mem_tracker = MemTrackerLimiter::create_shared( + MemTrackerLimiter::Type::METADATA, + fmt::format("{}[{}]", type_string(_type), type_name)); + } + _value_mem_tracker = std::make_shared( + fmt::format("{}::Value[{}]", type_string(_type), type_name)); } // if check_capacity failed, will return dummy lru cache, @@ -277,6 +292,7 @@ class LRUCachePolicy : public CachePolicy { LRUCacheType _lru_cache_type; 
std::shared_ptr _mem_tracker; + std::shared_ptr _value_mem_tracker; }; } // namespace doris diff --git a/be/src/runtime/memory/lru_cache_value_base.h b/be/src/runtime/memory/lru_cache_value_base.h index f9e534e6600df8..a9a3ae5ddab632 100644 --- a/be/src/runtime/memory/lru_cache_value_base.h +++ b/be/src/runtime/memory/lru_cache_value_base.h @@ -28,18 +28,27 @@ class LRUCacheValueBase { virtual ~LRUCacheValueBase() { if (_tracking_bytes > 0) { _mem_tracker->release(_tracking_bytes); + _value_mem_tracker->release(_value_tracking_bytes); } } void set_tracking_bytes(size_t tracking_bytes, - const std::shared_ptr& mem_tracker) { + const std::shared_ptr& mem_tracker, + size_t value_tracking_bytes, + const std::shared_ptr& value_mem_tracker) { this->_tracking_bytes = tracking_bytes; this->_mem_tracker = mem_tracker; + this->_value_tracking_bytes = value_tracking_bytes; + this->_value_mem_tracker = value_mem_tracker; + _mem_tracker->consume(_tracking_bytes); + _value_mem_tracker->consume(_value_tracking_bytes); } protected: size_t _tracking_bytes = 0; + size_t _value_tracking_bytes = 0; std::shared_ptr _mem_tracker; + std::shared_ptr _value_mem_tracker; }; } // namespace doris diff --git a/be/src/runtime/memory/mem_tracker_limiter.cpp b/be/src/runtime/memory/mem_tracker_limiter.cpp index 05ff13f0e7c646..ac4684835a670c 100644 --- a/be/src/runtime/memory/mem_tracker_limiter.cpp +++ b/be/src/runtime/memory/mem_tracker_limiter.cpp @@ -66,9 +66,13 @@ MemTrackerLimiter::MemTrackerLimiter(Type type, const std::string& label, int64_ _uid = UniqueId::gen_uid(); if (_type == Type::GLOBAL) { _group_num = 0; + } else if (_type == Type::METADATA) { + _group_num = 1; + } else if (_type == Type::CACHE) { + _group_num = 2; } else { _group_num = - mem_tracker_limiter_group_counter.fetch_add(1) % (MEM_TRACKER_GROUP_NUM - 1) + 1; + mem_tracker_limiter_group_counter.fetch_add(1) % (MEM_TRACKER_GROUP_NUM - 3) + 3; } // currently only select/load need runtime query statistics @@ -208,24 +212,20 
@@ std::string MemTrackerLimiter::print_address_sanitizers() { RuntimeProfile* MemTrackerLimiter::make_profile(RuntimeProfile* profile) const { RuntimeProfile* profile_snapshot = profile->create_child( fmt::format("{}@{}@id={}", _label, type_string(_type), _uid.to_string()), true, false); - RuntimeProfile::Counter* current_usage_counter = - ADD_COUNTER(profile_snapshot, "CurrentUsage", TUnit::BYTES); - RuntimeProfile::Counter* peak_usage_counter = - ADD_COUNTER(profile_snapshot, "PeakUsage", TUnit::BYTES); - COUNTER_SET(current_usage_counter, consumption()); - COUNTER_SET(peak_usage_counter, peak_consumption()); + RuntimeProfile::HighWaterMarkCounter* usage_counter = + profile_snapshot->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + COUNTER_SET(usage_counter, peak_consumption()); + COUNTER_SET(usage_counter, consumption()); if (has_limit()) { RuntimeProfile::Counter* limit_counter = ADD_COUNTER(profile_snapshot, "Limit", TUnit::BYTES); COUNTER_SET(limit_counter, _limit); } if (reserved_peak_consumption() != 0) { - RuntimeProfile::Counter* reserved_counter = - ADD_COUNTER(profile_snapshot, "ReservedMemory", TUnit::BYTES); - RuntimeProfile::Counter* reserved_peak_counter = - ADD_COUNTER(profile_snapshot, "ReservedPeakMemory", TUnit::BYTES); + RuntimeProfile::HighWaterMarkCounter* reserved_counter = + profile_snapshot->AddHighWaterMarkCounter("ReservedMemory", TUnit::BYTES); + COUNTER_SET(reserved_counter, reserved_peak_consumption()); COUNTER_SET(reserved_counter, reserved_consumption()); - COUNTER_SET(reserved_peak_counter, reserved_peak_consumption()); } return profile_snapshot; } @@ -268,8 +268,26 @@ void MemTrackerLimiter::make_type_trackers_profile(RuntimeProfile* profile, tracker->make_profile(profile); } } + } else if (type == Type::METADATA) { + std::lock_guard l( + ExecEnv::GetInstance()->mem_tracker_limiter_pool[1].group_lock); + for (auto trackerWptr : ExecEnv::GetInstance()->mem_tracker_limiter_pool[1].trackers) { + auto tracker = trackerWptr.lock(); 
+ if (tracker != nullptr) { + tracker->make_profile(profile); + } + } + } else if (type == Type::CACHE) { + std::lock_guard l( + ExecEnv::GetInstance()->mem_tracker_limiter_pool[2].group_lock); + for (auto trackerWptr : ExecEnv::GetInstance()->mem_tracker_limiter_pool[2].trackers) { + auto tracker = trackerWptr.lock(); + if (tracker != nullptr) { + tracker->make_profile(profile); + } + } } else { - for (unsigned i = 1; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { + for (unsigned i = 3; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { std::lock_guard l( ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].group_lock); for (auto trackerWptr : ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].trackers) { @@ -296,8 +314,8 @@ void MemTrackerLimiter::make_top_consumption_tasks_tracker_profile(RuntimeProfil std::unique_ptr tmp_profile_snapshot = std::make_unique("tmpSnapshot"); std::priority_queue> max_pq; - // start from 2, not include global type. - for (unsigned i = 1; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { + // start from 3, not include global/metadata/cache type. + for (unsigned i = 3; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { std::lock_guard l( ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].group_lock); for (auto trackerWptr : ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].trackers) { @@ -326,13 +344,19 @@ void MemTrackerLimiter::make_all_tasks_tracker_profile(RuntimeProfile* profile) types_profile[Type::SCHEMA_CHANGE] = profile->create_child("SchemaChangeTasks", true, false); types_profile[Type::OTHER] = profile->create_child("OtherTasks", true, false); - // start from 2, not include global type. - for (unsigned i = 1; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { + // start from 3, not include global/metadata/cache type. 
+ for (unsigned i = 3; i < ExecEnv::GetInstance()->mem_tracker_limiter_pool.size(); ++i) { std::lock_guard l( ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].group_lock); for (auto trackerWptr : ExecEnv::GetInstance()->mem_tracker_limiter_pool[i].trackers) { auto tracker = trackerWptr.lock(); if (tracker != nullptr) { + // BufferControlBlock will continue to exist for 5 minutes after the query ends, even if the + // result buffer is empty, and will not be shown in the profile. of course, this code is tricky. + if (tracker->consumption() == 0 && + tracker->label().starts_with("BufferControlBlock")) { + continue; + } tracker->make_profile(types_profile[tracker->type()]); } } diff --git a/be/src/runtime/memory/mem_tracker_limiter.h b/be/src/runtime/memory/mem_tracker_limiter.h index 445856b1f6af83..43b20a410ff27c 100644 --- a/be/src/runtime/memory/mem_tracker_limiter.h +++ b/be/src/runtime/memory/mem_tracker_limiter.h @@ -77,12 +77,14 @@ class MemTrackerLimiter final { enum class GCType { PROCESS = 0, WORK_LOAD_GROUP = 1 }; enum class Type { - GLOBAL = 0, // Life cycle is the same as the process, e.g. Cache and default Orphan + GLOBAL = 0, // Life cycle is the same as the process, except cache and metadata. QUERY = 1, // Count the memory consumption of all Query tasks. LOAD = 2, // Count the memory consumption of all Load tasks. COMPACTION = 3, // Count the memory consumption of all Base and Cumulative tasks. SCHEMA_CHANGE = 4, // Count the memory consumption of all SchemaChange tasks. - OTHER = 5, + METADATA = 5, // Count the memory consumption of all Metadata. + CACHE = 6, // Count the memory consumption of all Cache. + OTHER = 7, // Count the memory consumption of all other tasks, such as Clone, Snapshot, etc.. 
}; static std::string type_string(Type type) { @@ -97,8 +99,12 @@ class MemTrackerLimiter final { return "compaction"; case Type::SCHEMA_CHANGE: return "schema_change"; + case Type::METADATA: + return "metadata"; + case Type::CACHE: + return "cache"; case Type::OTHER: - return "other"; + return "other_task"; default: LOG(FATAL) << "not match type of mem tracker limiter :" << static_cast(type); } @@ -158,6 +164,8 @@ class MemTrackerLimiter final { int64_t consumption() const { return _mem_counter.current_value(); } int64_t peak_consumption() const { return _mem_counter.peak_value(); } + // Use carefully! only memory that cannot be allocated using Doris Allocator needs to be consumed manually. + // Ideally, all memory should use Doris Allocator. void consume(int64_t bytes) { _mem_counter.add(bytes); if (_query_statistics) { diff --git a/be/src/runtime/memory/memory_profile.cpp b/be/src/runtime/memory/memory_profile.cpp index 8dbdcbdd3af769..5d649c526014af 100644 --- a/be/src/runtime/memory/memory_profile.cpp +++ b/be/src/runtime/memory/memory_profile.cpp @@ -18,6 +18,9 @@ #include "runtime/memory/memory_profile.h" #include "bvar/reducer.h" +#include "olap/metadata_adder.h" +#include "olap/schema_cache.h" +#include "olap/tablet_schema_cache.h" #include "runtime/exec_env.h" #include "runtime/memory/global_memory_arbitrator.h" #include "runtime/memory/mem_tracker_limiter.h" @@ -28,6 +31,9 @@ namespace doris { static bvar::Adder memory_all_tracked_sum_bytes("memory_all_tracked_sum_bytes"); static bvar::Adder memory_global_trackers_sum_bytes("memory_global_trackers_sum_bytes"); +static bvar::Adder memory_metadata_trackers_sum_bytes( + "memory_metadata_trackers_sum_bytes"); +static bvar::Adder memory_cache_trackers_sum_bytes("memory_cache_trackers_sum_bytes"); static bvar::Adder memory_query_trackers_sum_bytes("memory_query_trackers_sum_bytes"); static bvar::Adder memory_load_trackers_sum_bytes("memory_load_trackers_sum_bytes"); static bvar::Adder 
memory_compaction_trackers_sum_bytes( @@ -40,140 +46,122 @@ static bvar::Adder memory_all_tasks_memory_bytes("memory_all_tasks_memo static bvar::Adder memory_untracked_memory_bytes("memory_untracked_memory_bytes"); MemoryProfile::MemoryProfile() { - _memory_overview_profile.set(std::make_unique("MemoryOverviewSnapshot")); +#ifdef ADDRESS_SANITIZER + _memory_overview_profile = std::make_unique("[ASAN]MemoryOverviewSnapshot"); +#else + _memory_overview_profile = std::make_unique("MemoryOverviewSnapshot"); +#endif _global_memory_profile.set(std::make_unique("GlobalMemorySnapshot")); + _metadata_memory_profile.set(std::make_unique("MetadataMemorySnapshot")); + _cache_memory_profile.set(std::make_unique("CacheMemorySnapshot")); _top_memory_tasks_profile.set(std::make_unique("TopMemoryTasksSnapshot")); _tasks_memory_profile.set(std::make_unique("TasksMemorySnapshot")); + init_memory_overview_counter(); } -void MemoryProfile::refresh_memory_overview_profile() { -#ifdef ADDRESS_SANITIZER - std::unique_ptr memory_overview_profile = - std::make_unique("[ASAN]MemoryOverviewSnapshot"); -#else - std::unique_ptr memory_overview_profile = - std::make_unique("MemoryOverviewSnapshot"); -#endif - std::unique_ptr global_memory_profile = - std::make_unique("GlobalMemorySnapshot"); - std::unique_ptr top_memory_tasks_profile = - std::make_unique("TopMemoryTasksSnapshot"); - - // 1. 
create profile +void MemoryProfile::init_memory_overview_counter() { RuntimeProfile* untracked_memory_profile = - memory_overview_profile->create_child("UntrackedMemory", true, false); + _memory_overview_profile->create_child("UntrackedMemory", true, false); RuntimeProfile* tracked_memory_profile = - memory_overview_profile->create_child("TrackedMemory", true, false); + _memory_overview_profile->create_child("TrackedMemory", true, false); RuntimeProfile* tasks_memory_overview_profile = tracked_memory_profile->create_child("TasksMemory", true, false); RuntimeProfile* tasks_memory_overview_details_profile = tasks_memory_overview_profile->create_child("Details", true, false); RuntimeProfile* global_memory_overview_profile = tracked_memory_profile->create_child("GlobalMemory", true, false); + RuntimeProfile* metadata_memory_overview_profile = + tracked_memory_profile->create_child("MetadataMemory", true, false); + RuntimeProfile* cache_memory_overview_profile = + tracked_memory_profile->create_child("CacheMemory", true, false); RuntimeProfile* jemalloc_memory_profile = tracked_memory_profile->create_child("JemallocMemory", true, false); RuntimeProfile* jemalloc_memory_details_profile = jemalloc_memory_profile->create_child("Details", true, false); - // 2. 
add counter - // 2.1 add process memory counter - RuntimeProfile::Counter* process_physical_memory_current_usage_counter = - ADD_COUNTER(memory_overview_profile, "PhysicalMemory(VmRSS)", TUnit::BYTES); - RuntimeProfile::Counter* process_physical_memory_peak_usage_counter = - memory_overview_profile->AddHighWaterMarkCounter("PhysicalMemoryPeak", TUnit::BYTES); - RuntimeProfile::Counter* process_virtual_memory_current_usage_counter = - ADD_COUNTER(memory_overview_profile, "VirtualMemory(VmSize)", TUnit::BYTES); - RuntimeProfile::Counter* process_virtual_memory_peak_usage_counter = - memory_overview_profile->AddHighWaterMarkCounter("VirtualMemoryPeak", TUnit::BYTES); - - // 2.2 add untracked memory counter - RuntimeProfile::Counter* untracked_memory_current_usage_counter = - ADD_COUNTER(untracked_memory_profile, "CurrentUsage", TUnit::BYTES); - RuntimeProfile::Counter* untracked_memory_peak_usage_counter = - untracked_memory_profile->AddHighWaterMarkCounter("PeakUsage", TUnit::BYTES); - - // 2.3 add tracked memory counter - RuntimeProfile::Counter* tracked_memory_current_usage_counter = - ADD_COUNTER(tracked_memory_profile, "CurrentUsage", TUnit::BYTES); - RuntimeProfile::Counter* tracked_memory_peak_usage_counter = - tracked_memory_profile->AddHighWaterMarkCounter("PeakUsage", TUnit::BYTES); - - // 2.4 add jemalloc memory counter - RuntimeProfile::Counter* jemalloc_memory_current_usage_counter = - ADD_COUNTER(jemalloc_memory_profile, "CurrentUsage", TUnit::BYTES); - RuntimeProfile::Counter* jemalloc_memory_peak_usage_counter = - jemalloc_memory_profile->AddHighWaterMarkCounter("PeakUsage", TUnit::BYTES); - RuntimeProfile::Counter* jemalloc_cache_current_usage_counter = - ADD_COUNTER(jemalloc_memory_details_profile, "Cache", TUnit::BYTES); - RuntimeProfile::Counter* jemalloc_cache_peak_usage_counter = - jemalloc_memory_details_profile->AddHighWaterMarkCounter("CachePeak", TUnit::BYTES); - RuntimeProfile::Counter* jemalloc_metadata_current_usage_counter = - 
ADD_COUNTER(jemalloc_memory_details_profile, "Metadata", TUnit::BYTES); - RuntimeProfile::Counter* jemalloc_metadata_peak_usage_counter = - jemalloc_memory_details_profile->AddHighWaterMarkCounter("MetadataPeak", TUnit::BYTES); - - // 2.5 add global memory counter - RuntimeProfile::Counter* global_current_usage_counter = - ADD_COUNTER(global_memory_overview_profile, "CurrentUsage", TUnit::BYTES); - RuntimeProfile::Counter* global_peak_usage_counter = - global_memory_overview_profile->AddHighWaterMarkCounter("PeakUsage", TUnit::BYTES); - - // 2.6 add tasks memory counter - RuntimeProfile::Counter* tasks_memory_current_usage_counter = - ADD_COUNTER_WITH_LEVEL(tasks_memory_overview_profile, "CurrentUsage", TUnit::BYTES, 1); + // 1 add process memory counter + _process_physical_memory_usage_counter = _memory_overview_profile->AddHighWaterMarkCounter( + "PhysicalMemory(VmRSS)", TUnit::BYTES); + _process_virtual_memory_usage_counter = _memory_overview_profile->AddHighWaterMarkCounter( + "VirtualMemory(VmSize)", TUnit::BYTES); + + // 2 add untracked/tracked memory counter + _untracked_memory_usage_counter = + untracked_memory_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + _tracked_memory_usage_counter = + tracked_memory_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + + // 3 add Jemalloc memory counter + _jemalloc_memory_usage_counter = + jemalloc_memory_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + _jemalloc_cache_usage_counter = + jemalloc_memory_details_profile->AddHighWaterMarkCounter("Cache", TUnit::BYTES); + _jemalloc_metadata_usage_counter = + jemalloc_memory_details_profile->AddHighWaterMarkCounter("Metadata", TUnit::BYTES); + + // 4 add global/metadata/cache memory counter + _global_usage_counter = + global_memory_overview_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + _metadata_usage_counter = + metadata_memory_overview_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + _cache_usage_counter = + 
cache_memory_overview_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); + + // 5 add tasks memory counter + _tasks_memory_usage_counter = + tasks_memory_overview_profile->AddHighWaterMarkCounter("Memory", TUnit::BYTES); // Reserved memory is the sum of all task reserved memory, is duplicated with all task memory counter. - RuntimeProfile::Counter* reserved_memory_current_usage_counter = ADD_CHILD_COUNTER_WITH_LEVEL( - tasks_memory_overview_profile, "ReservedMemory", TUnit::BYTES, "CurrentUsage", 1); - RuntimeProfile::Counter* reserved_memory_peak_usage_counter = - tasks_memory_overview_profile->AddHighWaterMarkCounter("ReservedMemoryPeak", - TUnit::BYTES, "CurrentUsage", 1); - RuntimeProfile::Counter* tasks_memory_peak_usage_counter = - tasks_memory_overview_profile->AddHighWaterMarkCounter("PeakUsage", TUnit::BYTES); - RuntimeProfile::Counter* query_current_usage_counter = - ADD_COUNTER_WITH_LEVEL(tasks_memory_overview_details_profile, "Query", TUnit::BYTES, 1); - RuntimeProfile::Counter* query_peak_usage_counter = - tasks_memory_overview_details_profile->AddHighWaterMarkCounter( - "QueryPeak", TUnit::BYTES, "Query", 1); - RuntimeProfile::Counter* load_current_usage_counter = - ADD_COUNTER_WITH_LEVEL(tasks_memory_overview_details_profile, "Load", TUnit::BYTES, 1); - RuntimeProfile::Counter* load_peak_usage_counter = - tasks_memory_overview_details_profile->AddHighWaterMarkCounter("LoadPeak", TUnit::BYTES, - "Load", 1); - RuntimeProfile::Counter* load_all_memtables_current_usage_counter = - ADD_CHILD_COUNTER_WITH_LEVEL(tasks_memory_overview_details_profile, - "AllMemTablesMemory", TUnit::BYTES, "Load", 1); - RuntimeProfile::Counter* load_all_memtables_peak_usage_counter = - ADD_CHILD_COUNTER_WITH_LEVEL(tasks_memory_overview_details_profile, - "AllMemTablesMemoryPeak", TUnit::BYTES, "Load", 1); - RuntimeProfile::Counter* compaction_current_usage_counter = ADD_COUNTER_WITH_LEVEL( - tasks_memory_overview_details_profile, "Compaction", TUnit::BYTES, 1); - 
RuntimeProfile::Counter* compaction_peak_usage_counter = - tasks_memory_overview_details_profile->AddHighWaterMarkCounter( - "CompactionPeak", TUnit::BYTES, "Compaction", 1); - RuntimeProfile::Counter* schema_change_current_usage_counter = ADD_COUNTER_WITH_LEVEL( - tasks_memory_overview_details_profile, "SchemaChange", TUnit::BYTES, 1); - RuntimeProfile::Counter* schema_change_peak_usage_counter = - tasks_memory_overview_details_profile->AddHighWaterMarkCounter( - "SchemaChangePeak", TUnit::BYTES, "SchemaChange", 1); - RuntimeProfile::Counter* other_current_usage_counter = - ADD_COUNTER_WITH_LEVEL(tasks_memory_overview_details_profile, "Other", TUnit::BYTES, 1); - RuntimeProfile::Counter* other_peak_usage_counter = - tasks_memory_overview_details_profile->AddHighWaterMarkCounter( - "OtherPeak", TUnit::BYTES, "Other", 1); - // 3. refresh counter - // 3.1 refresh process memory counter - COUNTER_SET(process_physical_memory_current_usage_counter, + _reserved_memory_usage_counter = tasks_memory_overview_profile->AddHighWaterMarkCounter( + "ReservedMemory", TUnit::BYTES, "Memory", 1); + _query_usage_counter = + tasks_memory_overview_details_profile->AddHighWaterMarkCounter("Query", TUnit::BYTES); + _load_usage_counter = + tasks_memory_overview_details_profile->AddHighWaterMarkCounter("Load", TUnit::BYTES); + _load_all_memtables_usage_counter = + tasks_memory_overview_details_profile->AddHighWaterMarkCounter("AllMemTablesMemory", + TUnit::BYTES, "Load", 1); + _compaction_usage_counter = tasks_memory_overview_details_profile->AddHighWaterMarkCounter( + "Compaction", TUnit::BYTES); + _schema_change_usage_counter = tasks_memory_overview_details_profile->AddHighWaterMarkCounter( + "SchemaChange", TUnit::BYTES); + _other_usage_counter = + tasks_memory_overview_details_profile->AddHighWaterMarkCounter("Other", TUnit::BYTES); +} + +void MemoryProfile::refresh_memory_overview_profile() { + // 1 create profile + std::unique_ptr global_memory_profile = + 
std::make_unique("GlobalMemorySnapshot"); + std::unique_ptr metadata_memory_profile = + std::make_unique("MetadataMemorySnapshot"); + std::unique_ptr cache_memory_profile = + std::make_unique("CacheMemorySnapshot"); + std::unique_ptr top_memory_tasks_profile = + std::make_unique("TopMemoryTasksSnapshot"); + + // 2 refresh process memory counter + COUNTER_SET(_process_physical_memory_usage_counter, PerfCounters::get_vm_rss()); // from /proc VmRSS VmHWM - COUNTER_SET(process_physical_memory_peak_usage_counter, PerfCounters::get_vm_hwm()); - COUNTER_SET(process_virtual_memory_current_usage_counter, + COUNTER_SET(_process_virtual_memory_usage_counter, PerfCounters::get_vm_size()); // from /proc VmSize VmPeak - COUNTER_SET(process_virtual_memory_peak_usage_counter, PerfCounters::get_vm_peak()); - // 3.2 refresh tracked memory counter + // 2 refresh metadata memory tracker + ExecEnv::GetInstance()->tablets_no_cache_mem_tracker()->set_consumption( + MetadataAdder::get_all_tablets_size() - + TabletSchemaCache::instance()->value_mem_consumption() - + SchemaCache::instance()->value_mem_consumption()); + ExecEnv::GetInstance()->rowsets_no_cache_mem_tracker()->set_consumption( + MetadataAdder::get_all_rowsets_size()); + ExecEnv::GetInstance()->segments_no_cache_mem_tracker()->set_consumption( + MetadataAdder::get_all_segments_estimate_size() - + SegmentLoader::instance()->cache_mem_usage()); + + // 4 refresh tracked memory counter std::unordered_map type_mem_sum = { {MemTrackerLimiter::Type::GLOBAL, 0}, {MemTrackerLimiter::Type::QUERY, 0}, {MemTrackerLimiter::Type::LOAD, 0}, {MemTrackerLimiter::Type::COMPACTION, 0}, - {MemTrackerLimiter::Type::SCHEMA_CHANGE, 0}, {MemTrackerLimiter::Type::OTHER, 0}}; + {MemTrackerLimiter::Type::SCHEMA_CHANGE, 0}, {MemTrackerLimiter::Type::METADATA, 0}, + {MemTrackerLimiter::Type::CACHE, 0}, {MemTrackerLimiter::Type::OTHER, 0}}; // always ExecEnv::ready(), because Daemon::_stop_background_threads_latch for (auto& group : 
ExecEnv::GetInstance()->mem_tracker_limiter_pool) { std::lock_guard l(group.group_lock); @@ -191,42 +179,46 @@ void MemoryProfile::refresh_memory_overview_profile() { all_tracked_mem_sum += it.second; switch (it.first) { case MemTrackerLimiter::Type::GLOBAL: - COUNTER_SET(global_current_usage_counter, it.second); - COUNTER_SET(global_peak_usage_counter, it.second); + COUNTER_SET(_global_usage_counter, it.second); memory_global_trackers_sum_bytes << it.second - memory_global_trackers_sum_bytes.get_value(); break; case MemTrackerLimiter::Type::QUERY: - COUNTER_SET(query_current_usage_counter, it.second); - COUNTER_SET(query_peak_usage_counter, it.second); + COUNTER_SET(_query_usage_counter, it.second); tasks_trackers_mem_sum += it.second; memory_query_trackers_sum_bytes << it.second - memory_query_trackers_sum_bytes.get_value(); break; case MemTrackerLimiter::Type::LOAD: - COUNTER_SET(load_current_usage_counter, it.second); - COUNTER_SET(load_peak_usage_counter, it.second); + COUNTER_SET(_load_usage_counter, it.second); tasks_trackers_mem_sum += it.second; memory_load_trackers_sum_bytes << it.second - memory_load_trackers_sum_bytes.get_value(); break; case MemTrackerLimiter::Type::COMPACTION: - COUNTER_SET(compaction_current_usage_counter, it.second); - COUNTER_SET(compaction_peak_usage_counter, it.second); + COUNTER_SET(_compaction_usage_counter, it.second); tasks_trackers_mem_sum += it.second; memory_compaction_trackers_sum_bytes << it.second - memory_compaction_trackers_sum_bytes.get_value(); break; case MemTrackerLimiter::Type::SCHEMA_CHANGE: - COUNTER_SET(schema_change_current_usage_counter, it.second); - COUNTER_SET(schema_change_peak_usage_counter, it.second); + COUNTER_SET(_schema_change_usage_counter, it.second); tasks_trackers_mem_sum += it.second; memory_schema_change_trackers_sum_bytes << it.second - memory_schema_change_trackers_sum_bytes.get_value(); break; + case MemTrackerLimiter::Type::METADATA: + COUNTER_SET(_metadata_usage_counter, it.second); + 
memory_metadata_trackers_sum_bytes + << it.second - memory_metadata_trackers_sum_bytes.get_value(); + break; + case MemTrackerLimiter::Type::CACHE: + COUNTER_SET(_cache_usage_counter, it.second); + memory_cache_trackers_sum_bytes + << it.second - memory_cache_trackers_sum_bytes.get_value(); + break; case MemTrackerLimiter::Type::OTHER: - COUNTER_SET(other_current_usage_counter, it.second); - COUNTER_SET(other_peak_usage_counter, it.second); + COUNTER_SET(_other_usage_counter, it.second); tasks_trackers_mem_sum += it.second; memory_other_trackers_sum_bytes << it.second - memory_other_trackers_sum_bytes.get_value(); @@ -235,60 +227,52 @@ void MemoryProfile::refresh_memory_overview_profile() { MemTrackerLimiter::make_type_trackers_profile(global_memory_profile.get(), MemTrackerLimiter::Type::GLOBAL); + MemTrackerLimiter::make_type_trackers_profile(metadata_memory_profile.get(), + MemTrackerLimiter::Type::METADATA); + MemTrackerLimiter::make_type_trackers_profile(cache_memory_profile.get(), + MemTrackerLimiter::Type::CACHE); MemTrackerLimiter::make_top_consumption_tasks_tracker_profile(top_memory_tasks_profile.get(), 15); - COUNTER_SET(tasks_memory_current_usage_counter, tasks_trackers_mem_sum); - COUNTER_SET(tasks_memory_peak_usage_counter, tasks_trackers_mem_sum); + COUNTER_SET(_tasks_memory_usage_counter, tasks_trackers_mem_sum); memory_all_tasks_memory_bytes << tasks_trackers_mem_sum - memory_all_tasks_memory_bytes.get_value(); - COUNTER_SET(reserved_memory_current_usage_counter, - GlobalMemoryArbitrator::process_reserved_memory()); - COUNTER_SET(reserved_memory_peak_usage_counter, - GlobalMemoryArbitrator::process_reserved_memory()); + COUNTER_SET(_reserved_memory_usage_counter, GlobalMemoryArbitrator::process_reserved_memory()); memory_reserved_memory_bytes << GlobalMemoryArbitrator::process_reserved_memory() - memory_reserved_memory_bytes.get_value(); all_tracked_mem_sum += MemInfo::allocator_cache_mem(); - COUNTER_SET(jemalloc_cache_current_usage_counter, - 
static_cast(MemInfo::allocator_cache_mem())); - COUNTER_SET(jemalloc_cache_peak_usage_counter, + COUNTER_SET(_jemalloc_cache_usage_counter, static_cast(MemInfo::allocator_cache_mem())); all_tracked_mem_sum += MemInfo::allocator_metadata_mem(); - COUNTER_SET(jemalloc_metadata_current_usage_counter, - static_cast(MemInfo::allocator_metadata_mem())); - COUNTER_SET(jemalloc_metadata_peak_usage_counter, + COUNTER_SET(_jemalloc_metadata_usage_counter, static_cast(MemInfo::allocator_metadata_mem())); - COUNTER_SET(jemalloc_memory_current_usage_counter, - jemalloc_cache_current_usage_counter->value() + - jemalloc_metadata_current_usage_counter->value()); - COUNTER_SET(jemalloc_memory_peak_usage_counter, - jemalloc_cache_current_usage_counter->value() + - jemalloc_metadata_current_usage_counter->value()); - - COUNTER_SET(tracked_memory_current_usage_counter, all_tracked_mem_sum); - COUNTER_SET(tracked_memory_peak_usage_counter, all_tracked_mem_sum); + COUNTER_SET(_jemalloc_memory_usage_counter, + _jemalloc_cache_usage_counter->current_value() + + _jemalloc_metadata_usage_counter->current_value()); + + COUNTER_SET(_tracked_memory_usage_counter, all_tracked_mem_sum); memory_all_tracked_sum_bytes << all_tracked_mem_sum - memory_all_tracked_sum_bytes.get_value(); - // 3.3 refresh untracked memory counter + // 5 refresh untracked memory counter int64_t untracked_memory = - process_physical_memory_current_usage_counter->value() - all_tracked_mem_sum; - COUNTER_SET(untracked_memory_current_usage_counter, untracked_memory); - COUNTER_SET(untracked_memory_peak_usage_counter, untracked_memory); + _process_physical_memory_usage_counter->current_value() - all_tracked_mem_sum; + COUNTER_SET(_untracked_memory_usage_counter, untracked_memory); memory_untracked_memory_bytes << untracked_memory - memory_untracked_memory_bytes.get_value(); - // 3.4 refresh additional tracker printed when memory exceeds limit. 
- COUNTER_SET(load_all_memtables_current_usage_counter, - ExecEnv::GetInstance()->memtable_memory_limiter()->mem_tracker()->consumption()); + // 6 refresh additional tracker printed when memory exceeds limit. COUNTER_SET( - load_all_memtables_peak_usage_counter, + _load_all_memtables_usage_counter, ExecEnv::GetInstance()->memtable_memory_limiter()->mem_tracker()->peak_consumption()); + COUNTER_SET(_load_all_memtables_usage_counter, + ExecEnv::GetInstance()->memtable_memory_limiter()->mem_tracker()->consumption()); - // 4. reset profile - _memory_overview_profile.set(std::move(memory_overview_profile)); + // 7. reset profile _global_memory_profile.set(std::move(global_memory_profile)); + _metadata_memory_profile.set(std::move(metadata_memory_profile)); + _cache_memory_profile.set(std::move(cache_memory_profile)); _top_memory_tasks_profile.set(std::move(top_memory_tasks_profile)); } @@ -302,16 +286,25 @@ void MemoryProfile::refresh_tasks_memory_profile() { void MemoryProfile::make_memory_profile(RuntimeProfile* profile) const { RuntimeProfile* memory_profile_snapshot = profile->create_child("MemoryProfile", true, false); - auto memory_overview_version_ptr = _memory_overview_profile.get(); RuntimeProfile* memory_overview_profile = - memory_profile_snapshot->create_child(memory_overview_version_ptr->name(), true, false); - memory_overview_profile->merge(const_cast(memory_overview_version_ptr.get())); + memory_profile_snapshot->create_child(_memory_overview_profile->name(), true, false); + memory_overview_profile->merge(const_cast(_memory_overview_profile.get())); auto global_memory_version_ptr = _global_memory_profile.get(); RuntimeProfile* global_memory_profile = memory_profile_snapshot->create_child(global_memory_version_ptr->name(), true, false); global_memory_profile->merge(const_cast(global_memory_version_ptr.get())); + auto metadata_memory_version_ptr = _metadata_memory_profile.get(); + RuntimeProfile* metadata_memory_profile = + 
memory_profile_snapshot->create_child(metadata_memory_version_ptr->name(), true, false); + metadata_memory_profile->merge(const_cast(metadata_memory_version_ptr.get())); + + auto cache_memory_version_ptr = _cache_memory_profile.get(); + RuntimeProfile* cache_memory_profile = + memory_profile_snapshot->create_child(cache_memory_version_ptr->name(), true, false); + cache_memory_profile->merge(const_cast(cache_memory_version_ptr.get())); + auto top_memory_tasks_version_ptr = _top_memory_tasks_profile.get(); RuntimeProfile* top_memory_tasks_profile = memory_profile_snapshot->create_child( top_memory_tasks_version_ptr->name(), true, false); @@ -346,6 +339,8 @@ void MemoryProfile::print_log_process_usage() { LOG(WARNING) << "Process Memory Summary: " + GlobalMemoryArbitrator::process_mem_log_str(); LOG(WARNING) << "\n" << print_memory_overview_profile(); LOG(WARNING) << "\n" << print_global_memory_profile(); + LOG(WARNING) << "\n" << print_metadata_memory_profile(); + LOG(WARNING) << "\n" << print_cache_memory_profile(); LOG(WARNING) << "\n" << print_top_memory_tasks_profile(); } } diff --git a/be/src/runtime/memory/memory_profile.h b/be/src/runtime/memory/memory_profile.h index 9f1bab0c02a802..c6aefb72f22e1a 100644 --- a/be/src/runtime/memory/memory_profile.h +++ b/be/src/runtime/memory/memory_profile.h @@ -33,31 +33,27 @@ class MemoryProfile { void make_memory_profile(RuntimeProfile* profile) const; std::string print_memory_overview_profile() const { - std::stringstream ss; - auto version_ptr = _memory_overview_profile.get(); - version_ptr->pretty_print(&ss); - return ss.str(); + return return_memory_profile_str(_memory_overview_profile.get()); } std::string print_global_memory_profile() const { - std::stringstream ss; - auto version_ptr = _global_memory_profile.get(); - version_ptr->pretty_print(&ss); - return ss.str(); + return return_memory_profile_str(_global_memory_profile.get().get()); + } + + std::string print_metadata_memory_profile() const { + return 
return_memory_profile_str(_metadata_memory_profile.get().get()); + } + + std::string print_cache_memory_profile() const { + return return_memory_profile_str(_cache_memory_profile.get().get()); } std::string print_top_memory_tasks_profile() const { - std::stringstream ss; - auto version_ptr = _top_memory_tasks_profile.get(); - version_ptr->pretty_print(&ss); - return ss.str(); + return return_memory_profile_str(_top_memory_tasks_profile.get().get()); } std::string print_tasks_memory_profile() const { - std::stringstream ss; - auto version_ptr = _tasks_memory_profile.get(); - version_ptr->pretty_print(&ss); - return ss.str(); + return return_memory_profile_str(_tasks_memory_profile.get().get()); } static int64_t query_current_usage(); @@ -71,11 +67,50 @@ class MemoryProfile { void print_log_process_usage(); private: - MultiVersion _memory_overview_profile; + std::string return_memory_profile_str(const RuntimeProfile* profile) const { + std::stringstream ss; + profile->pretty_print(&ss); + return ss.str(); + } + + void init_memory_overview_counter(); + + std::unique_ptr _memory_overview_profile; MultiVersion _global_memory_profile; + MultiVersion _metadata_memory_profile; + MultiVersion _cache_memory_profile; MultiVersion _top_memory_tasks_profile; MultiVersion _tasks_memory_profile; + // process memory counter + RuntimeProfile::HighWaterMarkCounter* _process_physical_memory_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _process_virtual_memory_usage_counter; + + // untracked/tracked memory counter + RuntimeProfile::HighWaterMarkCounter* _untracked_memory_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _tracked_memory_usage_counter; + + // Jemalloc memory counter + RuntimeProfile::HighWaterMarkCounter* _jemalloc_memory_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _jemalloc_cache_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _jemalloc_metadata_usage_counter; + + // global/metadata/cache memory counter + 
RuntimeProfile::HighWaterMarkCounter* _global_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _metadata_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _cache_usage_counter; + + // tasks memory counter + RuntimeProfile::HighWaterMarkCounter* _tasks_memory_usage_counter; + // reserved memory is the sum of all task reserved memory, is duplicated with all task memory counter. + RuntimeProfile::HighWaterMarkCounter* _reserved_memory_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _query_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _load_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _load_all_memtables_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _compaction_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _schema_change_usage_counter; + RuntimeProfile::HighWaterMarkCounter* _other_usage_counter; + std::atomic _enable_print_log_process_usage {true}; }; diff --git a/be/src/runtime/routine_load/routine_load_task_executor.h b/be/src/runtime/routine_load/routine_load_task_executor.h index 0e597d796c9f77..b1196f7824afac 100644 --- a/be/src/runtime/routine_load/routine_load_task_executor.h +++ b/be/src/runtime/routine_load/routine_load_task_executor.h @@ -73,6 +73,8 @@ class RoutineLoadTaskExecutor { std::vector* partition_offsets, int timeout); + ThreadPool& get_thread_pool() { return *_thread_pool; } + private: // execute the task void exec_task(std::shared_ptr ctx, DataConsumerPool* pool, diff --git a/be/src/runtime/runtime_filter_mgr.cpp b/be/src/runtime/runtime_filter_mgr.cpp index bb100fcbb42ec5..c16db7c67d3420 100644 --- a/be/src/runtime/runtime_filter_mgr.cpp +++ b/be/src/runtime/runtime_filter_mgr.cpp @@ -90,7 +90,7 @@ std::vector> RuntimeFilterMgr::get_consume_filte Status RuntimeFilterMgr::register_consumer_filter(const TRuntimeFilterDesc& desc, const TQueryOptions& options, int node_id, std::shared_ptr* consumer_filter, - bool build_bf_exactly, bool need_local_merge) { + bool need_local_merge) { 
SCOPED_CONSUME_MEM_TRACKER(_tracker.get()); int32_t key = desc.filter_id; bool has_exist = false; @@ -110,7 +110,7 @@ Status RuntimeFilterMgr::register_consumer_filter(const TRuntimeFilterDesc& desc if (!has_exist) { std::shared_ptr filter; RETURN_IF_ERROR(IRuntimeFilter::create(_state, &desc, &options, RuntimeFilterRole::CONSUMER, - node_id, &filter, build_bf_exactly)); + node_id, &filter)); _consumer_map[key].emplace_back(node_id, filter); *consumer_filter = filter; } else if (!need_local_merge) { @@ -122,7 +122,7 @@ Status RuntimeFilterMgr::register_consumer_filter(const TRuntimeFilterDesc& desc Status RuntimeFilterMgr::register_local_merge_producer_filter( const doris::TRuntimeFilterDesc& desc, const doris::TQueryOptions& options, - std::shared_ptr producer_filter, bool build_bf_exactly) { + std::shared_ptr producer_filter) { DCHECK(_is_global); SCOPED_CONSUME_MEM_TRACKER(_tracker.get()); int32_t key = desc.filter_id; @@ -143,8 +143,7 @@ Status RuntimeFilterMgr::register_local_merge_producer_filter( if (iter->second.filters.empty()) { std::shared_ptr merge_filter; RETURN_IF_ERROR(IRuntimeFilter::create(_state, &desc, &options, - RuntimeFilterRole::PRODUCER, -1, &merge_filter, - build_bf_exactly)); + RuntimeFilterRole::PRODUCER, -1, &merge_filter)); merge_filter->set_ignored(); iter->second.filters.emplace_back(merge_filter); } @@ -181,10 +180,9 @@ doris::LocalMergeFilters* RuntimeFilterMgr::get_local_merge_producer_filters(int return &iter->second; } -Status RuntimeFilterMgr::register_producer_filter(const TRuntimeFilterDesc& desc, - const TQueryOptions& options, - std::shared_ptr* producer_filter, - bool build_bf_exactly) { +Status RuntimeFilterMgr::register_producer_filter( + const TRuntimeFilterDesc& desc, const TQueryOptions& options, + std::shared_ptr* producer_filter) { DCHECK(!_is_global); SCOPED_CONSUME_MEM_TRACKER(_tracker.get()); int32_t key = desc.filter_id; @@ -196,7 +194,7 @@ Status RuntimeFilterMgr::register_producer_filter(const 
TRuntimeFilterDesc& desc return Status::InvalidArgument("filter has registed"); } RETURN_IF_ERROR(IRuntimeFilter::create(_state, &desc, &options, RuntimeFilterRole::PRODUCER, -1, - producer_filter, build_bf_exactly)); + producer_filter)); _producer_map.emplace(key, *producer_filter); return Status::OK(); } @@ -233,8 +231,8 @@ Status RuntimeFilterMergeControllerEntity::_init_with_desc( cnt_val->filter = cnt_val->pool->add(new IRuntimeFilter(_state, runtime_filter_desc)); auto filter_id = runtime_filter_desc->filter_id; - RETURN_IF_ERROR(cnt_val->filter->init_with_desc(&cnt_val->runtime_filter_desc, query_options, - -1, false)); + RETURN_IF_ERROR( + cnt_val->filter->init_with_desc(&cnt_val->runtime_filter_desc, query_options, -1)); cnt_val->filter->set_ignored(); _filter_map.emplace(filter_id, cnt_val); return Status::OK(); diff --git a/be/src/runtime/runtime_filter_mgr.h b/be/src/runtime/runtime_filter_mgr.h index 0a6f8318feaba0..9f4cf5f4e22a07 100644 --- a/be/src/runtime/runtime_filter_mgr.h +++ b/be/src/runtime/runtime_filter_mgr.h @@ -100,19 +100,17 @@ class RuntimeFilterMgr { // register filter Status register_consumer_filter(const TRuntimeFilterDesc& desc, const TQueryOptions& options, int node_id, std::shared_ptr* consumer_filter, - bool build_bf_exactly = false, bool need_local_merge = false); + bool need_local_merge = false); Status register_local_merge_producer_filter(const TRuntimeFilterDesc& desc, const TQueryOptions& options, - std::shared_ptr producer_filter, - bool build_bf_exactly = false); + std::shared_ptr producer_filter); Status get_local_merge_producer_filters(int filter_id, LocalMergeFilters** local_merge_filters); LocalMergeFilters* get_local_merge_producer_filters(int filter_id); Status register_producer_filter(const TRuntimeFilterDesc& desc, const TQueryOptions& options, - std::shared_ptr* producer_filter, - bool build_bf_exactly = false); + std::shared_ptr* producer_filter); // update filter by remote void set_runtime_filter_params(const 
TRuntimeFilterParams& runtime_filter_params); diff --git a/be/src/runtime/runtime_state.cpp b/be/src/runtime/runtime_state.cpp index 344180bad771ac..f3376d06858ec0 100644 --- a/be/src/runtime/runtime_state.cpp +++ b/be/src/runtime/runtime_state.cpp @@ -123,37 +123,6 @@ RuntimeState::RuntimeState(const TUniqueId& instance_id, const TUniqueId& query_ DCHECK(_query_mem_tracker != nullptr && _query_mem_tracker->label() != "Orphan"); } -RuntimeState::RuntimeState(pipeline::PipelineFragmentContext*, const TUniqueId& instance_id, - const TUniqueId& query_id, int32_t fragment_id, - const TQueryOptions& query_options, const TQueryGlobals& query_globals, - ExecEnv* exec_env, QueryContext* ctx) - : _profile("Fragment " + print_id(instance_id)), - _load_channel_profile(""), - _obj_pool(new ObjectPool()), - _unreported_error_idx(0), - _query_id(query_id), - _fragment_id(fragment_id), - _per_fragment_instance_idx(0), - _num_rows_load_total(0), - _num_rows_load_filtered(0), - _num_rows_load_unselected(0), - _num_rows_filtered_in_strict_mode_partial_update(0), - _num_print_error_rows(0), - _num_bytes_load_total(0), - _num_finished_scan_range(0), - _error_row_number(0), - _query_ctx(ctx) { - [[maybe_unused]] auto status = init(instance_id, query_options, query_globals, exec_env); - _query_mem_tracker = ctx->query_mem_tracker; -#ifdef BE_TEST - if (_query_mem_tracker == nullptr) { - init_mem_trackers(); - } -#endif - DCHECK(_query_mem_tracker != nullptr && _query_mem_tracker->label() != "Orphan"); - DCHECK(status.ok()); -} - RuntimeState::RuntimeState(const TUniqueId& query_id, int32_t fragment_id, const TQueryOptions& query_options, const TQueryGlobals& query_globals, ExecEnv* exec_env, QueryContext* ctx) @@ -295,7 +264,7 @@ Status RuntimeState::init(const TUniqueId& fragment_instance_id, const TQueryOpt } std::weak_ptr RuntimeState::get_query_ctx_weak() { - return _exec_env->fragment_mgr()->get_or_erase_query_ctx_with_lock(_query_ctx->query_id()); + return 
_exec_env->fragment_mgr()->get_query_ctx(_query_ctx->query_id()); } void RuntimeState::init_mem_trackers(const std::string& name, const TUniqueId& id) { @@ -516,14 +485,13 @@ RuntimeFilterMgr* RuntimeState::global_runtime_filter_mgr() { } Status RuntimeState::register_producer_runtime_filter( - const TRuntimeFilterDesc& desc, std::shared_ptr* producer_filter, - bool build_bf_exactly) { + const TRuntimeFilterDesc& desc, std::shared_ptr* producer_filter) { // Producers are created by local runtime filter mgr and shared by global runtime filter manager. // When RF is published, consumers in both global and local RF mgr will be found. - RETURN_IF_ERROR(local_runtime_filter_mgr()->register_producer_filter( - desc, query_options(), producer_filter, build_bf_exactly)); + RETURN_IF_ERROR(local_runtime_filter_mgr()->register_producer_filter(desc, query_options(), + producer_filter)); RETURN_IF_ERROR(global_runtime_filter_mgr()->register_local_merge_producer_filter( - desc, query_options(), *producer_filter, build_bf_exactly)); + desc, query_options(), *producer_filter)); return Status::OK(); } @@ -532,10 +500,10 @@ Status RuntimeState::register_consumer_runtime_filter( std::shared_ptr* consumer_filter) { if (desc.has_remote_targets || need_local_merge) { return global_runtime_filter_mgr()->register_consumer_filter(desc, query_options(), node_id, - consumer_filter, false, true); + consumer_filter, true); } else { return local_runtime_filter_mgr()->register_consumer_filter(desc, query_options(), node_id, - consumer_filter, false, false); + consumer_filter, false); } } diff --git a/be/src/runtime/runtime_state.h b/be/src/runtime/runtime_state.h index 0bc81bca4d99a1..a49567109a3b31 100644 --- a/be/src/runtime/runtime_state.h +++ b/be/src/runtime/runtime_state.h @@ -85,12 +85,7 @@ class RuntimeState { const TQueryOptions& query_options, const TQueryGlobals& query_globals, ExecEnv* exec_env, QueryContext* ctx); - // for only use in pipelineX - 
RuntimeState(pipeline::PipelineFragmentContext*, const TUniqueId& instance_id, - const TUniqueId& query_id, int32 fragment_id, const TQueryOptions& query_options, - const TQueryGlobals& query_globals, ExecEnv* exec_env, QueryContext* ctx); - - // Used by pipelineX. This runtime state is only used for setup. + // Used by pipeline. This runtime state is only used for setup. RuntimeState(const TUniqueId& query_id, int32 fragment_id, const TQueryOptions& query_options, const TQueryGlobals& query_globals, ExecEnv* exec_env, QueryContext* ctx); @@ -561,8 +556,7 @@ class RuntimeState { } Status register_producer_runtime_filter(const doris::TRuntimeFilterDesc& desc, - std::shared_ptr* producer_filter, - bool build_bf_exactly); + std::shared_ptr* producer_filter); Status register_consumer_runtime_filter(const doris::TRuntimeFilterDesc& desc, bool need_local_merge, int node_id, diff --git a/be/src/service/arrow_flight/arrow_flight_batch_reader.cpp b/be/src/service/arrow_flight/arrow_flight_batch_reader.cpp index e935aff996d55e..c24fcb73384494 100644 --- a/be/src/service/arrow_flight/arrow_flight_batch_reader.cpp +++ b/be/src/service/arrow_flight/arrow_flight_batch_reader.cpp @@ -56,7 +56,7 @@ arrow::Status ArrowFlightBatchReaderBase::_return_invalid_status(const std::stri } ArrowFlightBatchReaderBase::~ArrowFlightBatchReaderBase() { - VLOG_NOTICE << fmt::format( + LOG(INFO) << fmt::format( "ArrowFlightBatchReader finished, packet_seq={}, result_addr={}:{}, finistId={}, " "convert_arrow_batch_timer={}, deserialize_block_timer={}, peak_memory_usage={}", _packet_seq, _statement->result_addr.hostname, _statement->result_addr.port, diff --git a/be/src/service/http_service.cpp b/be/src/service/http_service.cpp index 57600d1f56aae9..912f9f5ff403e7 100644 --- a/be/src/service/http_service.cpp +++ b/be/src/service/http_service.cpp @@ -80,6 +80,7 @@ #include "util/doris_metrics.h" namespace doris { +#include "common/compile_check_begin.h" namespace { std::shared_ptr 
get_rate_limit_group(event_base* event_base) { auto rate_limit = config::download_binlog_rate_limit_kbs; @@ -473,4 +474,5 @@ int HttpService::get_real_port() const { return _ev_http_server->get_real_port(); } +#include "common/compile_check_end.h" } // namespace doris diff --git a/be/src/service/internal_service.cpp b/be/src/service/internal_service.cpp index adcd07e7de7484..439f3f17faf00f 100644 --- a/be/src/service/internal_service.cpp +++ b/be/src/service/internal_service.cpp @@ -1240,7 +1240,10 @@ void PInternalService::report_stream_load_status(google::protobuf::RpcController void PInternalService::get_info(google::protobuf::RpcController* controller, const PProxyRequest* request, PProxyResult* response, google::protobuf::Closure* done) { - bool ret = _heavy_work_pool.try_offer([this, request, response, done]() { + bool ret = _exec_env->routine_load_task_executor()->get_thread_pool().submit_func([this, + request, + response, + done]() { brpc::ClosureGuard closure_guard(done); // PProxyRequest is defined in gensrc/proto/internal_service.proto // Currently it supports 2 kinds of requests: diff --git a/be/src/util/hash_util.hpp b/be/src/util/hash_util.hpp index d444daa8c68d11..fbf10b75ae02c0 100644 --- a/be/src/util/hash_util.hpp +++ b/be/src/util/hash_util.hpp @@ -38,14 +38,6 @@ namespace doris { // Utility class to compute hash values. 
class HashUtil { public: - template - static uint32_t fixed_len_to_uint32(T value) { - if constexpr (sizeof(T) <= sizeof(uint32_t)) { - return (uint32_t)value; - } - return std::hash()(value); - } - static uint32_t zlib_crc_hash(const void* data, uint32_t bytes, uint32_t hash) { return crc32(hash, (const unsigned char*)data, bytes); } @@ -305,7 +297,7 @@ class HashUtil { #endif } - static uint64_t hash64(const void* data, uint32_t bytes, uint64_t seed) { + static uint64_t hash64(const void* data, uint64_t bytes, uint64_t seed) { #ifdef _SSE4_2_ if (LIKELY(CpuInfo::is_supported(CpuInfo::SSE4_2))) { return crc_hash64(data, bytes, seed); diff --git a/be/src/util/runtime_profile.cpp b/be/src/util/runtime_profile.cpp index 45db607a342743..1df4d8b55c278e 100644 --- a/be/src/util/runtime_profile.cpp +++ b/be/src/util/runtime_profile.cpp @@ -28,6 +28,7 @@ #include #include #include +#include #include "common/object_pool.h" #include "util/container_util.hpp" @@ -72,8 +73,7 @@ void RuntimeProfile::merge(RuntimeProfile* other) { dst_iter = _counter_map.find(src_iter->first); if (dst_iter == _counter_map.end()) { - _counter_map[src_iter->first] = _pool->add( - new Counter(src_iter->second->type(), src_iter->second->value())); + _counter_map[src_iter->first] = _pool->add(src_iter->second->clone()); } else { DCHECK(dst_iter->second->type() == src_iter->second->type()); @@ -574,8 +574,6 @@ void RuntimeProfile::to_thrift(TRuntimeProfileTree* tree) { } void RuntimeProfile::to_thrift(std::vector* nodes) { - nodes->reserve(nodes->size() + _children.size()); - int index = nodes->size(); nodes->push_back(TRuntimeProfileNode()); TRuntimeProfileNode& node = (*nodes)[index]; @@ -602,10 +600,13 @@ void RuntimeProfile::to_thrift(std::vector* nodes) { ChildVector children; { + // _children may be modified during to_thrift(), + // so we have to lock and copy _children to avoid race condition std::lock_guard l(_children_lock); children = _children; } node.num_children = children.size(); + 
nodes->reserve(nodes->size() + children.size()); for (int i = 0; i < children.size(); ++i) { int child_idx = nodes->size(); diff --git a/be/src/util/runtime_profile.h b/be/src/util/runtime_profile.h index 6e393ac673a628..7130acbd2f9427 100644 --- a/be/src/util/runtime_profile.h +++ b/be/src/util/runtime_profile.h @@ -100,6 +100,8 @@ class RuntimeProfile { : _value(value), _type(type), _level(level) {} virtual ~Counter() = default; + virtual Counter* clone() const { return new Counter(type(), value(), _level); } + virtual void update(int64_t delta) { _value.fetch_add(delta, std::memory_order_relaxed); } void bit_or(int64_t delta) { _value.fetch_or(delta, std::memory_order_relaxed); } @@ -137,7 +139,7 @@ class RuntimeProfile { TUnit::type type() const { return _type; } - virtual int64_t level() { return _level; } + virtual int64_t level() const { return _level; } private: friend class RuntimeProfile; @@ -151,8 +153,16 @@ class RuntimeProfile { /// as value()) and the current value. class HighWaterMarkCounter : public Counter { public: - HighWaterMarkCounter(TUnit::type unit, int64_t level, const std::string& parent_name) - : Counter(unit, 0, level), current_value_(0), _parent_name(parent_name) {} + HighWaterMarkCounter(TUnit::type unit, int64_t level, const std::string& parent_name, + int64_t value = 0, int64_t current_value = 0) + : Counter(unit, value, level), + current_value_(current_value), + _parent_name(parent_name) {} + + virtual Counter* clone() const override { + return new HighWaterMarkCounter(type(), level(), parent_name(), value(), + current_value()); + } void add(int64_t delta) { current_value_.fetch_add(delta, std::memory_order_relaxed); @@ -188,10 +198,9 @@ class RuntimeProfile { virtual void pretty_print(std::ostream* s, const std::string& prefix, const std::string& name) const override { std::ostream& stream = *s; - stream << prefix << " - " << name << ": " - << PrettyPrinter::print(current_value(), type()) << std::endl; - stream << prefix << " - " 
<< name << "Peak: " - << PrettyPrinter::print(_value.load(std::memory_order_relaxed), type()) + stream << prefix << " - " << name + << " Current: " << PrettyPrinter::print(current_value(), type()) << " (Peak: " + << PrettyPrinter::print(_value.load(std::memory_order_relaxed), type()) << ")" << std::endl; } @@ -217,6 +226,8 @@ class RuntimeProfile { int64_t current_value() const { return current_value_.load(std::memory_order_relaxed); } + std::string parent_name() const { return _parent_name; } + private: /// Set '_value' to 'v' if 'v' is larger than '_value'. The entire operation is /// atomic. @@ -247,8 +258,13 @@ class RuntimeProfile { // Do not call Set() and Update(). class DerivedCounter : public Counter { public: - DerivedCounter(TUnit::type type, const DerivedCounterFunction& counter_fn) - : Counter(type, 0), _counter_fn(counter_fn) {} + DerivedCounter(TUnit::type type, const DerivedCounterFunction& counter_fn, + int64_t value = 0, int64_t level = 1) + : Counter(type, value, level), _counter_fn(counter_fn) {} + + virtual Counter* clone() const override { + return new DerivedCounter(type(), _counter_fn, value(), level()); + } int64_t value() const override { return _counter_fn(); } @@ -259,8 +275,13 @@ class RuntimeProfile { // NonZeroCounter will not be converted to Thrift if the value is 0. 
class NonZeroCounter : public Counter { public: - NonZeroCounter(TUnit::type type, int64_t level, const std::string& parent_name) - : Counter(type, 0, level), _parent_name(parent_name) {} + NonZeroCounter(TUnit::type type, int64_t level, const std::string& parent_name, + int64_t value = 0) + : Counter(type, value, level), _parent_name(parent_name) {} + + virtual Counter* clone() const override { + return new NonZeroCounter(type(), level(), parent_name(), value()); + } void to_thrift(const std::string& name, std::vector& tcounters, std::map>& child_counters_map) override { @@ -272,6 +293,8 @@ class RuntimeProfile { } } + std::string parent_name() const { return _parent_name; } + private: const std::string _parent_name; }; diff --git a/be/src/vec/aggregate_functions/aggregate_function.h b/be/src/vec/aggregate_functions/aggregate_function.h index 32fc9d5efce771..e0ec2bef62fc2a 100644 --- a/be/src/vec/aggregate_functions/aggregate_function.h +++ b/be/src/vec/aggregate_functions/aggregate_function.h @@ -36,6 +36,7 @@ #include "vec/data_types/data_type_string.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" class Arena; class IColumn; @@ -598,3 +599,5 @@ class AggregateFunctionGuard { }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.cpp b/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.cpp index 18662bf66cf38c..8bf6c32c0872de 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.cpp @@ -29,6 +29,7 @@ #include "vec/functions/function.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" AggregateFunctionPtr create_aggregate_function_approx_count_distinct( const std::string& name, const DataTypes& argument_types, const bool result_is_nullable, diff --git 
a/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.h b/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.h index d267499e059818..3ef22be9fca74c 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.h +++ b/be/src/vec/aggregate_functions/aggregate_function_approx_count_distinct.h @@ -38,6 +38,7 @@ #include "vec/io/io_helper.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -64,8 +65,7 @@ struct AggregateFunctionApproxCountDistinctData { void write(BufferWritable& buf) const { std::string result; result.resize(hll_data.max_serialized_size()); - int size = hll_data.serialize((uint8_t*)result.data()); - result.resize(size); + result.resize(hll_data.serialize((uint8_t*)result.data())); write_binary(result, buf); } @@ -136,3 +136,5 @@ class AggregateFunctionApproxCountDistinct final }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_avg.cpp b/be/src/vec/aggregate_functions/aggregate_function_avg.cpp index 6a6711f90f983e..6109f0b0c601cd 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_avg.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_avg.cpp @@ -25,6 +25,7 @@ #include "vec/core/field.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template struct Avg { diff --git a/be/src/vec/aggregate_functions/aggregate_function_avg.h b/be/src/vec/aggregate_functions/aggregate_function_avg.h index 62fbb8078ea949..8b24db692aef05 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_avg.h +++ b/be/src/vec/aggregate_functions/aggregate_function_avg.h @@ -41,6 +41,7 @@ #include "vec/io/io_helper.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -72,7 +73,8 @@ struct AggregateFunctionAvgData { ResultT result() const { if 
constexpr (std::is_floating_point_v) { if constexpr (std::numeric_limits::is_iec559) { - return static_cast(sum) / count; /// allow division by zero + return static_cast(sum) / + static_cast(count); /// allow division by zero } } @@ -91,7 +93,7 @@ struct AggregateFunctionAvgData { if constexpr (IsDecimal256) { return static_cast(sum / T(count)); } else { - return static_cast(sum) / count; + return static_cast(sum) / static_cast(count); } } } @@ -124,7 +126,11 @@ class AggregateFunctionAvg final IsDecimalV2, ColumnDecimal, std::conditional_t, ColumnDecimal, ColumnFloat64>>; + // The result calculated by PercentileApprox is an approximate value, + // so the underlying storage uses float. The following calls will involve + // an implicit cast to float. + using DataType = typename Data::ResultType; /// ctor for native types AggregateFunctionAvg(const DataTypes& argument_types_) : IAggregateFunctionDataHelper>(argument_types_), @@ -148,9 +154,9 @@ class AggregateFunctionAvg final const auto& column = assert_cast(*columns[0]); if constexpr (IsDecimalNumber) { - this->data(place).sum += column.get_data()[row_num].value; + this->data(place).sum += (DataType)column.get_data()[row_num].value; } else { - this->data(place).sum += column.get_data()[row_num]; + this->data(place).sum += (DataType)column.get_data()[row_num]; } ++this->data(place).count; } @@ -282,3 +288,5 @@ class AggregateFunctionAvg final }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.cpp b/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.cpp index fc5df5303fd15d..70a707b02e992b 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.cpp @@ -21,6 +21,7 @@ #include "vec/aggregate_functions/helpers.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" void 
register_aggregate_function_avg_weighted(AggregateFunctionSimpleFactory& factory) { factory.register_function_both("avg_weighted", creator_with_type::creator); diff --git a/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.h b/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.h index b59a3dccf0cea8..d1a5921b45039f 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.h +++ b/be/src/vec/aggregate_functions/aggregate_function_avg_weighted.h @@ -35,6 +35,7 @@ #include "vec/io/io_helper.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -57,7 +58,7 @@ struct AggregateFunctionAvgWeightedData { DecimalV2Value value = binary_cast(data_val); data_sum = data_sum + (double(value) * weight_val); } else { - data_sum = data_sum + (data_val * weight_val); + data_sum = data_sum + (double(data_val) * weight_val); } weight_sum = weight_sum + weight_val; } @@ -138,3 +139,5 @@ class AggregateFunctionAvgWeight final }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_binary.h b/be/src/vec/aggregate_functions/aggregate_function_binary.h index 9fba9d11a1013a..fd5fc55d253661 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_binary.h +++ b/be/src/vec/aggregate_functions/aggregate_function_binary.h @@ -36,6 +36,7 @@ #include "vec/io/io_helper.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template typename Moments> struct StatFunc { @@ -127,3 +128,5 @@ AggregateFunctionPtr create_with_two_basic_numeric_types(const DataTypePtr& firs } } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_bit.cpp b/be/src/vec/aggregate_functions/aggregate_function_bit.cpp index 97a6c0e92fa723..981ced1fbd5a46 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bit.cpp +++ 
b/be/src/vec/aggregate_functions/aggregate_function_bit.cpp @@ -24,6 +24,7 @@ #include "vec/aggregate_functions/helpers.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" void register_aggregate_function_bit(AggregateFunctionSimpleFactory& factory) { factory.register_function_both( diff --git a/be/src/vec/aggregate_functions/aggregate_function_bit.h b/be/src/vec/aggregate_functions/aggregate_function_bit.h index 1ab01b03ceea38..d9760fdd30080b 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bit.h +++ b/be/src/vec/aggregate_functions/aggregate_function_bit.h @@ -30,6 +30,7 @@ #include "vec/io/io_helper.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -142,4 +143,5 @@ class AggregateFunctionBitwise final } }; -} // namespace doris::vectorized \ No newline at end of file +} // namespace doris::vectorized +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_bitmap.cpp b/be/src/vec/aggregate_functions/aggregate_function_bitmap.cpp index e9c86d4b9556da..47ddf2d81b6a71 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bitmap.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_bitmap.cpp @@ -23,6 +23,7 @@ #include "vec/data_types/data_type_nullable.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template class AggregateFunctionTemplate> AggregateFunctionPtr create_with_int_data_type(const DataTypes& argument_type) { @@ -33,7 +34,11 @@ AggregateFunctionPtr create_with_int_data_type(const DataTypes& argument_type) { return std::make_shared>>( \ argument_type); \ } - FOR_INTEGER_TYPES(DISPATCH) + // Keep consistent with the FE definition; the function does not have an int128 type. 
+ DISPATCH(Int8) + DISPATCH(Int16) + DISPATCH(Int32) + DISPATCH(Int64) #undef DISPATCH LOG(WARNING) << "with unknowed type, failed in create_with_int_data_type bitmap_union_int" << " and type is: " << argument_type[0]->get_name(); diff --git a/be/src/vec/aggregate_functions/aggregate_function_bitmap.h b/be/src/vec/aggregate_functions/aggregate_function_bitmap.h index b0619a63e1ffe8..fb17b0a80be092 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bitmap.h +++ b/be/src/vec/aggregate_functions/aggregate_function_bitmap.h @@ -38,6 +38,7 @@ #include "vec/data_types/data_type_number.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -432,4 +433,5 @@ AggregateFunctionPtr create_aggregate_function_bitmap_union(const std::string& n const DataTypes& argument_types, const bool result_is_nullable); -} // namespace doris::vectorized \ No newline at end of file +} // namespace doris::vectorized +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.cpp b/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.cpp index 0b95ddfd46f0d5..2a2c86303f3000 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.cpp @@ -23,6 +23,7 @@ #include "vec/data_types/data_type_nullable.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template AggregateFunctionPtr create_with_int_data_type(const DataTypes& argument_types) { @@ -32,7 +33,11 @@ AggregateFunctionPtr create_with_int_data_type(const DataTypes& argument_types) if (which.idx == TypeIndex::TYPE) { \ return std::make_shared>(argument_types); \ } - FOR_INTEGER_TYPES(DISPATCH) + // Keep consistent with the FE definition; the function does not have an int128 type. 
+ DISPATCH(Int8) + DISPATCH(Int16) + DISPATCH(Int32) + DISPATCH(Int64) #undef DISPATCH LOG(WARNING) << "with unknown type, failed in create_with_int_data_type bitmap_union_int" << " and type is: " << argument_types[0]->get_name(); diff --git a/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.h b/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.h index 5747faf1b8e8c1..bff32aa606ccd2 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.h +++ b/be/src/vec/aggregate_functions/aggregate_function_bitmap_agg.h @@ -31,6 +31,7 @@ #include "vec/data_types/data_type_bitmap.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -226,4 +227,5 @@ class AggregateFunctionBitmapAgg final } }; -} // namespace doris::vectorized \ No newline at end of file +} // namespace doris::vectorized +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_collect.cpp b/be/src/vec/aggregate_functions/aggregate_function_collect.cpp index d726b7c6355318..15806c739ed58c 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_collect.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_collect.cpp @@ -26,6 +26,7 @@ #include "vec/aggregate_functions/helpers.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template AggregateFunctionPtr do_create_agg_function_collect(bool distinct, const DataTypes& argument_types, @@ -72,12 +73,18 @@ AggregateFunctionPtr create_aggregate_function_collect_impl(const std::string& n if (which.is_date_or_datetime()) { return do_create_agg_function_collect(distinct, argument_types, result_is_nullable); - } else if (which.is_date_v2() || which.is_ipv4()) { + } else if (which.is_date_v2()) { return do_create_agg_function_collect(distinct, argument_types, result_is_nullable); - } else if (which.is_date_time_v2() || which.is_ipv6()) { + } else if (which.is_date_time_v2()) { return 
do_create_agg_function_collect(distinct, argument_types, result_is_nullable); + } else if (which.is_ipv6()) { + return do_create_agg_function_collect(distinct, argument_types, + result_is_nullable); + } else if (which.is_ipv4()) { + return do_create_agg_function_collect(distinct, argument_types, + result_is_nullable); } else if (which.is_string()) { return do_create_agg_function_collect( distinct, argument_types, result_is_nullable); diff --git a/be/src/vec/aggregate_functions/aggregate_function_collect.h b/be/src/vec/aggregate_functions/aggregate_function_collect.h index da310c6e0cc4c2..2d18a56313f3f9 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_collect.h +++ b/be/src/vec/aggregate_functions/aggregate_function_collect.h @@ -46,6 +46,7 @@ #include "vec/io/var_int.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; } // namespace vectorized @@ -836,3 +837,5 @@ class AggregateFunctionCollect }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_combinator.h b/be/src/vec/aggregate_functions/aggregate_function_combinator.h index 1593d74ed4e59d..0908ac8d0278f1 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_combinator.h +++ b/be/src/vec/aggregate_functions/aggregate_function_combinator.h @@ -26,6 +26,7 @@ #include "vec/data_types/data_type.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" /** Aggregate function combinator allows to take one aggregate function * and transform it to another aggregate function. 
@@ -69,3 +70,5 @@ class IAggregateFunctionCombinator { }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_corr.cpp b/be/src/vec/aggregate_functions/aggregate_function_corr.cpp index cdaab6e086f4a5..e0a51ca6629a06 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_corr.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_corr.cpp @@ -21,6 +21,7 @@ #include "vec/core/types.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template struct CorrMoment { diff --git a/be/src/vec/aggregate_functions/aggregate_function_count.cpp b/be/src/vec/aggregate_functions/aggregate_function_count.cpp index 5cfe5af41982f6..72d12cf65fe9d0 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_count.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_count.cpp @@ -26,6 +26,7 @@ #include "vec/aggregate_functions/factory_helpers.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" AggregateFunctionPtr create_aggregate_function_count(const std::string& name, const DataTypes& argument_types, diff --git a/be/src/vec/aggregate_functions/aggregate_function_count.h b/be/src/vec/aggregate_functions/aggregate_function_count.h index 7b54d074683b04..630994a7967957 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_count.h +++ b/be/src/vec/aggregate_functions/aggregate_function_count.h @@ -41,6 +41,7 @@ #include "vec/io/var_int.h" namespace doris { +#include "common/compile_check_begin.h" namespace vectorized { class Arena; class BufferReadable; @@ -321,3 +322,5 @@ class AggregateFunctionCountNotNullUnary final }; } // namespace doris::vectorized + +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.cpp b/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.cpp index 093b31d57db554..20235d9e2ef2e9 100644 --- 
a/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.cpp @@ -26,6 +26,7 @@ #include "vec/core/types.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" AggregateFunctionPtr create_aggregate_function_count_by_enum(const std::string& name, const DataTypes& argument_types, diff --git a/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.h b/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.h index 1f5093de68263e..543ae55f872da6 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.h +++ b/be/src/vec/aggregate_functions/aggregate_function_count_by_enum.h @@ -32,6 +32,7 @@ #include "vec/io/io_helper.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" struct CountByEnumData { std::unordered_map cbe; @@ -46,8 +47,7 @@ void build_json_from_vec(rapidjson::StringBuffer& buffer, doc.SetArray(); rapidjson::Document::AllocatorType& allocator = doc.GetAllocator(); - int vec_size_number = data_vec.size(); - for (int idx = 0; idx < vec_size_number; ++idx) { + for (size_t idx = 0; idx < data_vec.size(); ++idx) { rapidjson::Value obj(rapidjson::kObjectType); rapidjson::Value obj_cbe(rapidjson::kObjectType); @@ -239,4 +239,5 @@ class AggregateFunctionCountByEnum final size_t arg_count; }; -} // namespace doris::vectorized \ No newline at end of file +} // namespace doris::vectorized +#include "common/compile_check_end.h" diff --git a/be/src/vec/aggregate_functions/aggregate_function_covar.cpp b/be/src/vec/aggregate_functions/aggregate_function_covar.cpp index 4c5fe1321952d6..d9c091fb601868 100644 --- a/be/src/vec/aggregate_functions/aggregate_function_covar.cpp +++ b/be/src/vec/aggregate_functions/aggregate_function_covar.cpp @@ -28,6 +28,7 @@ #include "vec/data_types/data_type_nullable.h" namespace doris::vectorized { +#include "common/compile_check_begin.h" template