diff --git a/Cargo.lock b/Cargo.lock index 1424a2515ea89..a9ca62f37e52c 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -3979,6 +3979,7 @@ dependencies = [ "databend-common-storages-view", "databend-common-users", "databend-enterprise-data-mask-feature", + "databend-enterprise-hilbert-clustering", "databend-storages-common-cache", "databend-storages-common-io", "databend-storages-common-session", @@ -4630,6 +4631,18 @@ dependencies = [ "databend-common-meta-app", ] +[[package]] +name = "databend-enterprise-hilbert-clustering" +version = "0.1.0" +dependencies = [ + "async-backtrace", + "async-trait", + "databend-common-base", + "databend-common-catalog", + "databend-common-exception", + "databend-storages-common-table-meta", +] + [[package]] name = "databend-enterprise-inverted-index" version = "0.1.0" @@ -4690,6 +4703,7 @@ dependencies = [ "databend-enterprise-background-service", "databend-enterprise-data-mask-feature", "databend-enterprise-fail-safe", + "databend-enterprise-hilbert-clustering", "databend-enterprise-inverted-index", "databend-enterprise-resources-management", "databend-enterprise-storage-encryption", diff --git a/Cargo.toml b/Cargo.toml index eb73f1ccd05f1..5ffca0121cbc9 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -184,6 +184,7 @@ databend-enterprise-attach-table = { path = "src/query/ee_features/attach_table" databend-enterprise-background-service = { path = "src/query/ee_features/background_service" } databend-enterprise-data-mask-feature = { path = "src/query/ee_features/data_mask" } databend-enterprise-fail-safe = { path = "src/query/ee_features/fail_safe" } +databend-enterprise-hilbert-clustering = { path = "src/query/ee_features/hilbert_clustering" } databend-enterprise-inverted-index = { path = "src/query/ee_features/inverted_index" } databend-enterprise-meta = { path = "src/meta/ee" } databend-enterprise-query = { path = "src/query/ee" } diff --git a/src/common/exception/src/exception_code.rs b/src/common/exception/src/exception_code.rs index 71384fd959055..a059ccd8abc62 100644 --- a/src/common/exception/src/exception_code.rs +++ b/src/common/exception/src/exception_code.rs @@ -426,8 +426,9 @@ build_exceptions! { // recluster error codes NoNeedToRecluster(4011), NoNeedToCompact(4012), + UnsupportedClusterType(4013), - RefreshTableInfoFailure(4012), + RefreshTableInfoFailure(4021), } // Service errors [5001,6000]. 
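Reviewer note on the exception-code hunk above: `RefreshTableInfoFailure` previously shared code 4012 with `NoNeedToCompact`, so moving it to 4021 removes that collision while 4013 is taken by the new `UnsupportedClusterType`. Below is a minimal sketch of how the new code would typically be raised, assuming `build_exceptions!` generates the usual `ErrorCode::<Name>(msg)` constructor as it does for the existing codes, and assuming `ClusterType` carries a `Hilbert` variant alongside the `Linear` one referenced later in `compact_hook.rs`; the guard function itself is hypothetical and not part of this patch.

```rust
use databend_common_exception::{ErrorCode, Result};
use databend_storages_common_table_meta::table::ClusterType;

// Hypothetical guard: an operation that only supports linear clustering rejects
// Hilbert-clustered tables with the new error code (4013).
fn ensure_linear_cluster(cluster_type: Option<ClusterType>) -> Result<()> {
    match cluster_type {
        Some(ClusterType::Hilbert) => Err(ErrorCode::UnsupportedClusterType(
            "this operation only supports linear clustering",
        )),
        _ => Ok(()),
    }
}
```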
diff --git a/src/common/license/src/license.rs b/src/common/license/src/license.rs index 219a903498acb..2584893b7eda5 100644 --- a/src/common/license/src/license.rs +++ b/src/common/license/src/license.rs @@ -75,6 +75,8 @@ pub enum Feature { AmendTable, #[serde(alias = "system_management", alias = "SYSTEM_MANAGEMENT")] SystemManagement, + #[serde(alias = "hilbert_clustering", alias = "HILBERT_CLUSTERING")] + HilbertClustering, #[serde(other)] Unknown, } @@ -122,6 +124,7 @@ impl fmt::Display for Feature { } Feature::AmendTable => write!(f, "amend_table"), Feature::SystemManagement => write!(f, "system_management"), + Feature::HilbertClustering => write!(f, "hilbert_clustering"), Feature::Unknown => write!(f, "unknown"), } } @@ -169,7 +172,8 @@ impl Feature { | (Feature::InvertedIndex, Feature::InvertedIndex) | (Feature::VirtualColumn, Feature::VirtualColumn) | (Feature::AttacheTable, Feature::AttacheTable) - | (Feature::StorageEncryption, Feature::StorageEncryption) => Ok(true), + | (Feature::StorageEncryption, Feature::StorageEncryption) + | (Feature::HilbertClustering, Feature::HilbertClustering) => Ok(true), (_, _) => Ok(false), } } @@ -337,6 +341,11 @@ mod tests { serde_json::from_str::("\"amend_table\"").unwrap() ); + assert_eq!( + Feature::HilbertClustering, + serde_json::from_str::("\"hilbert_clustering\"").unwrap() + ); + assert_eq!( Feature::Unknown, serde_json::from_str::("\"ssss\"").unwrap() @@ -370,11 +379,12 @@ mod tests { storage_usage: Some(1), }), Feature::AmendTable, + Feature::HilbertClustering, ]), }; assert_eq!( - "LicenseInfo{ type: enterprise, org: databend, tenants: [databend_tenant,foo], features: [aggregate_index,amend_table,attach_table,background_service,compute_quota(threads_num: 1, memory_usage: 1),computed_column,data_mask,inverted_index,license_info,storage_encryption,storage_quota(storage_usage: 1),stream,vacuum,virtual_column] }", + "LicenseInfo{ type: enterprise, org: databend, tenants: [databend_tenant,foo], features: [aggregate_index,amend_table,attach_table,background_service,compute_quota(threads_num: 1, memory_usage: 1),computed_column,data_mask,hilbert_clustering,inverted_index,license_info,storage_encryption,storage_quota(storage_usage: 1),stream,vacuum,virtual_column] }", license_info.to_string() ); } diff --git a/src/query/catalog/src/plan/partition.rs b/src/query/catalog/src/plan/partition.rs index 3278c22d3123b..026f80d4c32f2 100644 --- a/src/query/catalog/src/plan/partition.rs +++ b/src/query/catalog/src/plan/partition.rs @@ -391,3 +391,10 @@ impl ReclusterParts { } } } + +#[derive(serde::Serialize, serde::Deserialize, Clone, Debug, Default)] +pub struct ReclusterInfoSideCar { + pub merged_blocks: Vec>, + pub removed_segment_indexes: Vec, + pub removed_statistics: Statistics, +} diff --git a/src/query/catalog/src/table.rs b/src/query/catalog/src/table.rs index d3e04f0686089..c58ecedb3f036 100644 --- a/src/query/catalog/src/table.rs +++ b/src/query/catalog/src/table.rs @@ -19,6 +19,9 @@ use std::sync::Arc; use chrono::DateTime; use chrono::Utc; +use databend_common_ast::ast::Expr; +use databend_common_ast::parser::parse_comma_separated_exprs; +use databend_common_ast::parser::tokenize_sql; use databend_common_exception::ErrorCode; use databend_common_exception::Result; use databend_common_expression::BlockThresholds; @@ -136,6 +139,28 @@ pub trait Table: Sync + Send { Some(cluster_type) } + fn resolve_cluster_keys(&self, ctx: Arc) -> Option> { + let Some((_, cluster_key_str)) = &self.cluster_key_meta() else { + return None; + }; + let tokens = 
tokenize_sql(cluster_key_str).unwrap(); + let sql_dialect = ctx.get_settings().get_sql_dialect().unwrap_or_default(); + let mut ast_exprs = parse_comma_separated_exprs(&tokens, sql_dialect).unwrap(); + // unwrap tuple. + if ast_exprs.len() == 1 { + if let Expr::Tuple { exprs, .. } = &ast_exprs[0] { + ast_exprs = exprs.clone(); + } + } else { + // Defensive check: + // `ast_exprs` should always contain one element which can be one of the following: + // 1. A tuple of composite cluster keys + // 2. A single cluster key + unreachable!("invalid cluster key ast expression, {:?}", ast_exprs); + } + Some(ast_exprs) + } + fn change_tracking_enabled(&self) -> bool { false } diff --git a/src/query/catalog/src/table_context.rs b/src/query/catalog/src/table_context.rs index c7f45b5701847..1e957eb2ea68c 100644 --- a/src/query/catalog/src/table_context.rs +++ b/src/query/catalog/src/table_context.rs @@ -279,11 +279,23 @@ pub trait TableContext: Send + Sync { max_files: Option, ) -> Result; - fn add_segment_location(&self, segment_loc: Location) -> Result<()>; + fn add_written_segment_location(&self, segment_loc: Location) -> Result<()>; - fn clear_segment_locations(&self) -> Result<()>; + fn clear_written_segment_locations(&self) -> Result<()>; - fn get_segment_locations(&self) -> Result>; + fn get_written_segment_locations(&self) -> Result>; + + fn add_selected_segment_location(&self, _segment_loc: Location) { + unimplemented!() + } + + fn get_selected_segment_locations(&self) -> Vec { + unimplemented!() + } + + fn clear_selected_segment_locations(&self) { + unimplemented!() + } fn add_file_status(&self, file_path: &str, file_status: FileStatus) -> Result<()>; diff --git a/src/query/ee/Cargo.toml b/src/query/ee/Cargo.toml index baaad1302bcdf..52a8c2d69f005 100644 --- a/src/query/ee/Cargo.toml +++ b/src/query/ee/Cargo.toml @@ -48,6 +48,7 @@ databend-enterprise-attach-table = { workspace = true } databend-enterprise-background-service = { workspace = true } databend-enterprise-data-mask-feature = { workspace = true } databend-enterprise-fail-safe = { workspace = true } +databend-enterprise-hilbert-clustering = { workspace = true } databend-enterprise-inverted-index = { workspace = true } databend-enterprise-resources-management = { workspace = true } databend-enterprise-storage-encryption = { workspace = true } diff --git a/src/query/ee/src/enterprise_services.rs b/src/query/ee/src/enterprise_services.rs index 1507ac44a43f0..23c75fd69b041 100644 --- a/src/query/ee/src/enterprise_services.rs +++ b/src/query/ee/src/enterprise_services.rs @@ -21,6 +21,7 @@ use crate::attach_table::RealAttachTableHandler; use crate::background_service::RealBackgroundService; use crate::data_mask::RealDatamaskHandler; use crate::fail_safe::RealFailSafeHandler; +use crate::hilbert_clustering::RealHilbertClusteringHandler; use crate::inverted_index::RealInvertedIndexHandler; use crate::license::license_mgr::RealLicenseManager; use crate::resource_management::init_resources_management; @@ -47,6 +48,7 @@ impl EnterpriseServices { RealStorageQuotaHandler::init(&cfg)?; RealFailSafeHandler::init()?; init_resources_management(&cfg).await?; + RealHilbertClusteringHandler::init()?; Ok(()) } } diff --git a/src/query/ee/src/hilbert_clustering/handler.rs b/src/query/ee/src/hilbert_clustering/handler.rs new file mode 100644 index 0000000000000..995d99496c72d --- /dev/null +++ b/src/query/ee/src/hilbert_clustering/handler.rs @@ -0,0 +1,239 @@ +// Copyright 2023 Databend Cloud +// +// Licensed under the Elastic License, Version 2.0 (the 
"License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// https://www.elastic.co/licensing/elastic-license +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +use std::sync::Arc; + +use databend_common_base::base::GlobalInstance; +use databend_common_catalog::plan::PushDownInfo; +use databend_common_catalog::plan::ReclusterInfoSideCar; +use databend_common_catalog::table::Table; +use databend_common_catalog::table_context::TableContext; +use databend_common_exception::Result; +use databend_common_expression::BlockThresholds; +use databend_common_storages_fuse::pruning::create_segment_location_vector; +use databend_common_storages_fuse::statistics::reducers::merge_statistics_mut; +use databend_common_storages_fuse::FuseTable; +use databend_common_storages_fuse::SegmentLocation; +use databend_common_storages_fuse::DEFAULT_BLOCK_PER_SEGMENT; +use databend_common_storages_fuse::FUSE_OPT_KEY_BLOCK_PER_SEGMENT; +use databend_enterprise_hilbert_clustering::HilbertClusteringHandler; +use databend_enterprise_hilbert_clustering::HilbertClusteringHandlerWrapper; +use databend_storages_common_table_meta::meta::ClusterStatistics; +use databend_storages_common_table_meta::meta::CompactSegmentInfo; +use databend_storages_common_table_meta::meta::Statistics; +use databend_storages_common_table_meta::meta::TableSnapshot; + +pub struct RealHilbertClusteringHandler {} + +#[async_trait::async_trait] +impl HilbertClusteringHandler for RealHilbertClusteringHandler { + #[async_backtrace::framed] + async fn do_hilbert_clustering( + &self, + table: Arc, + ctx: Arc, + push_downs: Option, + ) -> Result)>> { + let Some((cluster_key_id, _)) = table.cluster_key_meta() else { + return Ok(None); + }; + + let fuse_table = FuseTable::try_from_table(table.as_ref())?; + let Some(snapshot) = fuse_table.read_table_snapshot().await? else { + // no snapshot, no recluster. + return Ok(None); + }; + + let block_per_seg = + fuse_table.get_option(FUSE_OPT_KEY_BLOCK_PER_SEGMENT, DEFAULT_BLOCK_PER_SEGMENT); + let block_thresholds = fuse_table.get_block_thresholds(); + let thresholds = BlockThresholds { + max_rows_per_block: block_per_seg * block_thresholds.max_rows_per_block, + min_rows_per_block: block_per_seg * block_thresholds.min_rows_per_block, + max_bytes_per_block: block_per_seg * block_thresholds.max_bytes_per_block, + }; + let segment_locations = snapshot.segments.clone(); + let segment_locations = create_segment_location_vector(segment_locations, None); + + let max_threads = ctx.get_settings().get_max_threads()? as usize; + let chunk_size = max_threads * 4; + let mut checker = ReclusterChecker::new( + cluster_key_id, + thresholds, + push_downs.as_ref().is_none_or(|v| v.filters.is_none()), + ); + 'FOR: for chunk in segment_locations.chunks(chunk_size) { + // read segments. 
+ let compact_segments = FuseTable::segment_pruning( + &ctx, + fuse_table.schema_with_stream(), + fuse_table.get_operator(), + &push_downs, + fuse_table.get_storage_format(), + chunk.to_vec(), + ) + .await?; + + for (location, segment) in compact_segments.into_iter() { + if checker.add(location, segment) { + break 'FOR; + } + } + } + + let target_segments = checker.finalize(); + if target_segments.is_empty() { + return Ok(None); + } + + let rows_per_block = + block_thresholds.calc_rows_per_block(checker.total_size, checker.total_rows) as u64; + let block_size = ctx.get_settings().get_max_block_size()?; + ctx.get_settings() + .set_max_block_size(rows_per_block.min(block_size))?; + + let mut removed_statistics = Statistics::default(); + let mut removed_segment_indexes = Vec::with_capacity(target_segments.len()); + for (segment_loc, segment) in target_segments { + ctx.add_selected_segment_location(segment_loc.location); + removed_segment_indexes.push(segment_loc.segment_idx); + merge_statistics_mut( + &mut removed_statistics, + &segment.summary, + Some(cluster_key_id), + ); + } + + let recluster_info = ReclusterInfoSideCar { + merged_blocks: vec![], + removed_segment_indexes, + removed_statistics, + }; + Ok(Some((recluster_info, snapshot))) + } +} + +impl RealHilbertClusteringHandler { + pub fn init() -> Result<()> { + let handler = RealHilbertClusteringHandler {}; + let wrapper = HilbertClusteringHandlerWrapper::new(Box::new(handler)); + GlobalInstance::set(Arc::new(wrapper)); + Ok(()) + } +} + +struct ReclusterChecker { + segments: Vec<(SegmentLocation, Arc)>, + default_cluster_id: u32, + thresholds: BlockThresholds, + + total_rows: usize, + total_size: usize, + + finished: bool, + // Whether the target segments is at the head of snapshot. + head_of_snapshot: bool, +} + +impl ReclusterChecker { + fn new(default_cluster_id: u32, thresholds: BlockThresholds, head_of_snapshot: bool) -> Self { + Self { + segments: vec![], + default_cluster_id, + thresholds, + total_rows: 0, + total_size: 0, + finished: false, + head_of_snapshot, + } + } + + fn add(&mut self, location: SegmentLocation, segment: Arc) -> bool { + let row_count = segment.summary.row_count as usize; + let byte_size = segment.summary.uncompressed_byte_size as usize; + self.total_rows += row_count; + self.total_size += byte_size; + if !self + .thresholds + .check_large_enough(self.total_rows, self.total_size) + { + // totals < N + self.segments.push((location, segment)); + return false; + } + + let segment_should_recluster = self.should_recluster(&segment, |v| { + v.cluster_key_id != self.default_cluster_id || v.level != -1 + }); + let mut retained = false; + if !self.head_of_snapshot || segment_should_recluster { + if self + .thresholds + .check_for_compact(self.total_rows, self.total_size) + { + // N <= totals < 2N + self.segments.push((location, segment)); + retained = true; + } else if segment_should_recluster { + // totals >= 2N + self.segments = vec![(location, segment)]; + self.total_rows = row_count; + self.total_size = byte_size; + self.finished = true; + return true; + } + } + + if self.check_for_recluster() { + if !retained { + self.total_rows -= row_count; + self.total_size -= byte_size; + } + self.finished = true; + return true; + } + + self.reset(); + false + } + + fn finalize(&mut self) -> Vec<(SegmentLocation, Arc)> { + if !self.finished && !self.check_for_recluster() { + return vec![]; + } + std::mem::take(&mut self.segments) + } + + fn check_for_recluster(&self) -> bool { + match self.segments.len() { + 0 => false, + 
1 => self.should_recluster(&self.segments[0].1, |v| { + v.cluster_key_id != self.default_cluster_id + }), + _ => true, + } + } + + fn should_recluster(&self, segment: &CompactSegmentInfo, pred: F) -> bool + where F: Fn(&ClusterStatistics) -> bool { + segment.summary.cluster_stats.as_ref().is_none_or(pred) + } + + fn reset(&mut self) { + self.total_rows = 0; + self.total_size = 0; + self.head_of_snapshot = false; + self.segments.clear(); + } +} diff --git a/src/query/ee/src/hilbert_clustering/mod.rs b/src/query/ee/src/hilbert_clustering/mod.rs new file mode 100644 index 0000000000000..fa357368f0f4d --- /dev/null +++ b/src/query/ee/src/hilbert_clustering/mod.rs @@ -0,0 +1,17 @@ +// Copyright 2023 Databend Cloud +// +// Licensed under the Elastic License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// https://www.elastic.co/licensing/elastic-license +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +mod handler; + +pub use handler::RealHilbertClusteringHandler; diff --git a/src/query/ee/src/lib.rs b/src/query/ee/src/lib.rs index 9ea8a9f26fbac..c473e8550d817 100644 --- a/src/query/ee/src/lib.rs +++ b/src/query/ee/src/lib.rs @@ -18,6 +18,7 @@ pub mod background_service; pub mod data_mask; pub mod enterprise_services; pub mod fail_safe; +pub mod hilbert_clustering; pub mod inverted_index; pub mod license; pub mod resource_management; diff --git a/src/query/ee_features/hilbert_clustering/Cargo.toml b/src/query/ee_features/hilbert_clustering/Cargo.toml new file mode 100644 index 0000000000000..0f856e1c45143 --- /dev/null +++ b/src/query/ee_features/hilbert_clustering/Cargo.toml @@ -0,0 +1,24 @@ +[package] +name = "databend-enterprise-hilbert-clustering" +version = { workspace = true } +authors = { workspace = true } +license = { workspace = true } +publish = { workspace = true } +edition = { workspace = true } + +[lib] +doctest = false +test = true + +[dependencies] +async-backtrace = { workspace = true } +async-trait = { workspace = true } +databend-common-base = { workspace = true } +databend-common-catalog = { workspace = true } +databend-common-exception = { workspace = true } +databend-storages-common-table-meta = { workspace = true } + +[build-dependencies] + +[lints] +workspace = true diff --git a/src/query/ee_features/hilbert_clustering/src/handler.rs b/src/query/ee_features/hilbert_clustering/src/handler.rs new file mode 100644 index 0000000000000..a0104079d7026 --- /dev/null +++ b/src/query/ee_features/hilbert_clustering/src/handler.rs @@ -0,0 +1,59 @@ +// Copyright 2021 Datafuse Labs +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. 
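Aside on the `ReclusterChecker` above: segments are accumulated until the running totals cross the segment-level thresholds (the block-level thresholds scaled by `block_per_seg`, written as N in the inline comments). The sketch below is a simplified, rows-only illustration of the three ranges those comments describe; the real checker also weighs byte size, cluster statistics, and whether the group sits at the head of the snapshot.

```rust
/// Simplified classification of accumulated segment totals against a target size N,
/// mirroring the `totals < N`, `N <= totals < 2N`, `totals >= 2N` comments above.
#[derive(Debug, PartialEq)]
enum GroupAction {
    /// totals < N: keep collecting segments.
    Accumulate,
    /// N <= totals < 2N: the current segment completes the group.
    CloseWithCurrent,
    /// totals >= 2N: the group would be too large, restart from the current segment.
    RestartWithCurrent,
}

fn classify(total_rows: usize, n_rows: usize) -> GroupAction {
    if total_rows < n_rows {
        GroupAction::Accumulate
    } else if total_rows < 2 * n_rows {
        GroupAction::CloseWithCurrent
    } else {
        GroupAction::RestartWithCurrent
    }
}
```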
+ +use std::sync::Arc; + +use databend_common_base::base::GlobalInstance; +use databend_common_catalog::plan::PushDownInfo; +use databend_common_catalog::plan::ReclusterInfoSideCar; +use databend_common_catalog::table::Table; +use databend_common_catalog::table_context::TableContext; +use databend_common_exception::Result; +use databend_storages_common_table_meta::meta::TableSnapshot; + +#[async_trait::async_trait] +pub trait HilbertClusteringHandler: Sync + Send { + async fn do_hilbert_clustering( + &self, + table: Arc, + ctx: Arc, + push_downs: Option, + ) -> Result)>>; +} + +pub struct HilbertClusteringHandlerWrapper { + handler: Box, +} + +impl HilbertClusteringHandlerWrapper { + pub fn new(handler: Box) -> Self { + Self { handler } + } + + #[async_backtrace::framed] + pub async fn do_hilbert_clustering( + &self, + table: Arc, + ctx: Arc, + push_downs: Option, + ) -> Result)>> { + self.handler + .do_hilbert_clustering(table, ctx, push_downs) + .await + } +} + +pub fn get_hilbert_clustering_handler() -> Arc { + GlobalInstance::get() +} diff --git a/src/query/ee_features/hilbert_clustering/src/lib.rs b/src/query/ee_features/hilbert_clustering/src/lib.rs new file mode 100644 index 0000000000000..ff2070f19983b --- /dev/null +++ b/src/query/ee_features/hilbert_clustering/src/lib.rs @@ -0,0 +1,18 @@ +// Copyright 2021 Datafuse Labs +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. 
+ +#[allow(unused)] +mod handler; + +pub use handler::*; diff --git a/src/query/expression/src/kernels/sort.rs b/src/query/expression/src/kernels/sort.rs index 91bc7ebff2992..02a6c1fcb579d 100644 --- a/src/query/expression/src/kernels/sort.rs +++ b/src/query/expression/src/kernels/sort.rs @@ -16,6 +16,7 @@ use databend_common_exception::Result; use crate::types::DataType; use crate::visitor::ValueVisitor; +use crate::Column; use crate::ColumnBuilder; use crate::DataBlock; use crate::Scalar; @@ -126,8 +127,11 @@ pub fn compare_scalars(rows: Vec>, data_types: &[DataType]) -> Resul .into_iter() .map(|builder| builder.build()) .collect::>(); + compare_columns(order_columns, length) +} - let descriptions = order_columns +pub fn compare_columns(columns: Vec, length: usize) -> Result> { + let descriptions = columns .iter() .enumerate() .map(|(idx, _)| SortColumnDescription { @@ -139,7 +143,7 @@ pub fn compare_scalars(rows: Vec>, data_types: &[DataType]) -> Resul let mut sort_compare = SortCompare::new(descriptions, length, LimitType::None); - for array in order_columns { + for array in columns { sort_compare.visit_value(Value::Column(array))?; sort_compare.increment_column_index(); } diff --git a/src/query/functions/src/aggregates/aggregate_range_bound.rs b/src/query/functions/src/aggregates/aggregate_range_bound.rs new file mode 100644 index 0000000000000..b311a65f455e1 --- /dev/null +++ b/src/query/functions/src/aggregates/aggregate_range_bound.rs @@ -0,0 +1,368 @@ +// Copyright 2021 Datafuse Labs +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. 
+ +use std::any::Any; +use std::sync::Arc; + +use borsh::BorshDeserialize; +use borsh::BorshSerialize; +use databend_common_exception::ErrorCode; +use databend_common_exception::Result; +use databend_common_expression::compare_columns; +use databend_common_expression::types::array::ArrayColumnBuilder; +use databend_common_expression::types::Bitmap; +use databend_common_expression::types::*; +use databend_common_expression::with_number_mapped_type; +use databend_common_expression::AggregateFunctionRef; +use databend_common_expression::Scalar; +use ethnum::i256; +use rand::prelude::SliceRandom; +use rand::rngs::SmallRng; +use rand::thread_rng; +use rand::Rng; +use rand::SeedableRng; + +use super::assert_unary_arguments; +use super::AggregateUnaryFunction; +use super::FunctionData; +use super::UnaryState; +use crate::aggregates::aggregate_function_factory::AggregateFunctionDescription; +use crate::with_simple_no_number_mapped_type; + +struct RangeBoundData { + partitions: usize, + sample_size: usize, +} + +impl FunctionData for RangeBoundData { + fn as_any(&self) -> &dyn Any { + self + } +} + +#[derive(BorshSerialize, BorshDeserialize)] +pub struct RangeBoundState +where + T: ValueType, + T::Scalar: BorshSerialize + BorshDeserialize, +{ + values: Vec<(u64, Vec)>, + total_rows: usize, + total_samples: usize, +} + +impl Default for RangeBoundState +where + T: ValueType, + T::Scalar: BorshSerialize + BorshDeserialize, +{ + fn default() -> Self { + RangeBoundState:: { + values: vec![], + total_rows: 0, + total_samples: 0, + } + } +} + +impl UnaryState> for RangeBoundState +where + T: ArgType + Sync + Send, + T::Scalar: Ord + Sync + Send + BorshSerialize + BorshDeserialize, +{ + fn add( + &mut self, + other: T::ScalarRef<'_>, + function_data: Option<&dyn FunctionData>, + ) -> Result<()> { + let range_bound_data = unsafe { + function_data + .unwrap() + .as_any() + .downcast_ref_unchecked::() + }; + + let total_sample_size = std::cmp::min( + range_bound_data.sample_size * range_bound_data.partitions, + 10_000, + ); + + if self.values.is_empty() { + self.values.push((0, vec![])); + } + let (total_rows, samples) = &mut self.values[0]; + *total_rows += 1; + self.total_rows += 1; + if samples.len() < total_sample_size { + self.total_samples += 1; + samples.push(T::to_owned_scalar(other)); + } else { + let mut rng = thread_rng(); + let replacement_index = rng.gen_range(0..*total_rows) as usize; + if replacement_index < total_sample_size { + self.total_samples += 1; + samples[replacement_index] = T::to_owned_scalar(other); + } + } + Ok(()) + } + + fn add_batch( + &mut self, + other: T::Column, + validity: Option<&Bitmap>, + function_data: Option<&dyn FunctionData>, + ) -> Result<()> { + let column_len = T::column_len(&other); + let unset_bits = validity.map_or(0, |v| v.null_count()); + if unset_bits == column_len { + return Ok(()); + } + + let valid_size = column_len - unset_bits; + let range_bound_data = unsafe { + function_data + .unwrap() + .as_any() + .downcast_ref_unchecked::() + }; + let sample_size = std::cmp::max(valid_size / 100, range_bound_data.sample_size); + + let mut indices = validity.map_or_else( + || (0..column_len).collect::>(), + |v| { + v.iter() + .enumerate() + .filter_map(|(i, v)| v.then_some(i)) + .collect() + }, + ); + + let sampled_indices = if valid_size > sample_size { + let mut rng = SmallRng::from_entropy(); + indices.shuffle(&mut rng); + &indices[..sample_size] + } else { + &indices + }; + + let sample_values = sampled_indices + .iter() + .map(|i| T::to_owned_scalar(unsafe { 
T::index_column_unchecked(&other, *i) })) + .collect::>(); + + self.total_rows += valid_size; + self.total_samples += sample_values.len(); + self.values.push((valid_size as u64, sample_values)); + Ok(()) + } + + fn merge(&mut self, rhs: &Self) -> Result<()> { + self.values.extend_from_slice(&rhs.values); + self.total_rows += rhs.total_rows; + self.total_samples += rhs.total_samples; + Ok(()) + } + + fn merge_result( + &mut self, + builder: &mut ArrayColumnBuilder, + function_data: Option<&dyn FunctionData>, + ) -> Result<()> { + let range_bound_data = unsafe { + function_data + .unwrap() + .as_any() + .downcast_ref_unchecked::() + }; + let step = self.total_rows as f64 / range_bound_data.partitions as f64; + + let values = std::mem::take(&mut self.values); + let mut data = Vec::with_capacity(self.total_samples); + let mut weights = Vec::with_capacity(self.total_samples); + for (num, values) in values.into_iter() { + let weight = num as f64 / values.len() as f64; + values.into_iter().for_each(|v| { + data.push(v); + weights.push(weight); + }); + } + let col = T::upcast_column(T::column_from_vec(data.clone(), &[])); + let indices = compare_columns(vec![col], self.total_samples)?; + + let mut cum_weight = 0.0; + let mut target = step; + let mut bounds = Vec::with_capacity(range_bound_data.partitions - 1); + let mut previous_bound = None; + + let mut i = 0; + let mut j = 0; + while i < self.total_samples && j < range_bound_data.partitions - 1 { + let idx = indices[i] as usize; + let weight = weights[idx]; + cum_weight += weight; + if cum_weight >= target { + let data = &data[idx]; + if previous_bound.as_ref().map_or(true, |prev| data > prev) { + bounds.push(data.clone()); + target += step; + j += 1; + previous_bound = Some(data.clone()); + } + } + i += 1; + } + + let col = T::column_from_vec(bounds, &[]); + builder.push(col); + Ok(()) + } +} + +pub fn try_create_aggregate_range_bound_function( + display_name: &str, + params: Vec, + arguments: Vec, +) -> Result { + assert_unary_arguments(display_name, arguments.len())?; + let data_type = arguments[0].clone().remove_nullable(); + let function_data = get_partitions(¶ms, display_name)?; + let return_type = DataType::Array(Box::new(data_type.clone())); + + with_simple_no_number_mapped_type!(|T| match data_type { + DataType::T => { + let func = AggregateUnaryFunction::, T, ArrayType>::try_create( + display_name, + return_type, + params, + arguments[0].clone(), + ) + .with_function_data(Box::new(function_data)) + .with_need_drop(true); + Ok(Arc::new(func)) + } + DataType::Number(num_type) => { + with_number_mapped_type!(|NUM| match num_type { + NumberDataType::NUM => { + let func = AggregateUnaryFunction::< + RangeBoundState>, + NumberType, + ArrayType>, + >::try_create( + display_name, return_type, params, arguments[0].clone() + ) + .with_function_data(Box::new(function_data)) + .with_need_drop(true); + Ok(Arc::new(func)) + } + }) + } + DataType::Decimal(DecimalDataType::Decimal128(_)) => { + let func = AggregateUnaryFunction::< + RangeBoundState>, + DecimalType, + ArrayType>, + >::try_create( + display_name, return_type, params, arguments[0].clone() + ) + .with_function_data(Box::new(function_data)) + .with_need_drop(true); + Ok(Arc::new(func)) + } + DataType::Decimal(DecimalDataType::Decimal256(_)) => { + let func = AggregateUnaryFunction::< + RangeBoundState>, + DecimalType, + ArrayType>, + >::try_create( + display_name, return_type, params, arguments[0].clone() + ) + .with_function_data(Box::new(function_data)) + .with_need_drop(true); + 
Ok(Arc::new(func)) + } + DataType::Binary => { + let func = AggregateUnaryFunction::< + RangeBoundState, + BinaryType, + ArrayType, + >::try_create( + display_name, return_type, params, arguments[0].clone() + ) + .with_function_data(Box::new(function_data)) + .with_need_drop(true); + Ok(Arc::new(func)) + } + _ => Err(ErrorCode::BadDataValueType(format!( + "{} does not support type '{:?}'", + display_name, data_type + ))), + }) +} + +/// The `range_bound(partition_num, sample_size)(col)` function calculates the partition boundaries +/// for a given column `col`. It divides the column's data range into `partition_num` partitions, +/// using `sample_size` to determine the number of samples per block. The resulting boundaries +/// define the ranges for each partition. +/// +/// Example: +/// For a column with values `(0, 1, 3, 6, 8)` and `partition_num = 3`, the function calculates the +/// partition boundaries based on the distribution of the data. The boundaries might be `[1, 6]`. +pub fn aggregate_range_bound_function_desc() -> AggregateFunctionDescription { + AggregateFunctionDescription::creator(Box::new( + crate::aggregates::try_create_aggregate_range_bound_function, + )) +} + +fn get_partitions(params: &[Scalar], display_name: &str) -> Result { + match params.len() { + 0 => Ok(RangeBoundData { + partitions: 1024, + sample_size: 100, + }), + 1 => { + let partitions = get_positive_integer(¶ms[0], display_name)?; + Ok(RangeBoundData { + partitions, + sample_size: 100, + }) + } + 2 => { + let partitions = get_positive_integer(¶ms[0], display_name)?; + let sample_size = get_positive_integer(¶ms[1], display_name)?; + Ok(RangeBoundData { + partitions, + sample_size, + }) + } + _ => Err(ErrorCode::BadArguments(format!( + "The number of arguments in aggregate function {} must be [0, 1, 2]", + display_name, + ))), + } +} + +fn get_positive_integer(val: &Scalar, display_name: &str) -> Result { + if let Scalar::Number(number) = val { + if let Some(number) = number.integer_to_i128() { + if number > 0 { + return Ok(number as usize); + } + } + } + Err(ErrorCode::BadDataValueType(format!( + "The argument of aggregate function {} must be positive int", + display_name + ))) +} diff --git a/src/query/functions/src/aggregates/aggregator.rs b/src/query/functions/src/aggregates/aggregator.rs index 4c9c88a6e9b40..a8141c310940d 100644 --- a/src/query/functions/src/aggregates/aggregator.rs +++ b/src/query/functions/src/aggregates/aggregator.rs @@ -52,6 +52,7 @@ use crate::aggregates::aggregate_quantile_cont_function_desc; use crate::aggregates::aggregate_quantile_disc_function_desc; use crate::aggregates::aggregate_quantile_tdigest_function_desc; use crate::aggregates::aggregate_quantile_tdigest_weighted_function_desc; +use crate::aggregates::aggregate_range_bound_function_desc; use crate::aggregates::aggregate_retention_function_desc; use crate::aggregates::aggregate_skewness_function_desc; use crate::aggregates::aggregate_st_collect_function_desc; @@ -119,6 +120,8 @@ impl Aggregators { factory.register("skewness", aggregate_skewness_function_desc()); factory.register("string_agg", aggregate_string_agg_function_desc()); + factory.register("range_bound", aggregate_range_bound_function_desc()); + factory.register( "bitmap_and_count", aggregate_bitmap_and_count_function_desc(), diff --git a/src/query/functions/src/aggregates/mod.rs b/src/query/functions/src/aggregates/mod.rs index a24d642ff76f2..8f21e14d41074 100644 --- a/src/query/functions/src/aggregates/mod.rs +++ b/src/query/functions/src/aggregates/mod.rs @@ 
-40,6 +40,7 @@ mod aggregate_quantile_cont; mod aggregate_quantile_disc; mod aggregate_quantile_tdigest; mod aggregate_quantile_tdigest_weighted; +mod aggregate_range_bound; mod aggregate_retention; mod aggregate_scalar_state; mod aggregate_skewness; @@ -74,6 +75,7 @@ pub use aggregate_quantile_cont::*; pub use aggregate_quantile_disc::*; pub use aggregate_quantile_tdigest::*; pub use aggregate_quantile_tdigest_weighted::*; +pub use aggregate_range_bound::*; pub use aggregate_retention::*; pub use aggregate_skewness::*; pub use aggregate_st_collect::*; diff --git a/src/query/functions/src/scalars/hilbert.rs b/src/query/functions/src/scalars/hilbert.rs index 67f426e6ffb19..615f2d6dab004 100644 --- a/src/query/functions/src/scalars/hilbert.rs +++ b/src/query/functions/src/scalars/hilbert.rs @@ -15,6 +15,8 @@ use databend_common_expression::hilbert_index; use databend_common_expression::types::ArrayType; use databend_common_expression::types::BinaryType; +use databend_common_expression::types::GenericType; +use databend_common_expression::types::NullableType; use databend_common_expression::types::NumberDataType; use databend_common_expression::types::NumberType; use databend_common_expression::types::StringType; @@ -56,25 +58,56 @@ pub fn register(registry: &mut FunctionRegistry) { }) } - registry.register_passthrough_nullable_2_arg::, NumberType, BinaryType, _, _>( + registry.register_combine_nullable_2_arg::>, NumberType, BinaryType, _, _>( "hilbert_index", |_, _, _| FunctionDomain::Full, - vectorize_with_builder_2_arg::, NumberType, BinaryType>( + vectorize_with_builder_2_arg::>, NumberType, NullableType>( |val, len, builder, ctx| { - let points = val.iter().collect::>(); + let mut points = Vec::with_capacity(val.len()); + for a in val.iter() { + if a.is_none() { + builder.push_null(); + return; + } + points.push(a.unwrap()); + } let dimension = points.len(); if std::intrinsics::unlikely(len > 64) { ctx.set_error(builder.len(), "Width must be less than or equal to 64"); + builder.push_null(); } else if std::intrinsics::unlikely(!(2..=5).contains(&dimension)) { ctx.set_error(builder.len(), "Dimension must between 2 and 5"); + builder.push_null(); } else { let slice = hilbert_index(&points, len as usize); - builder.put_slice(&slice); + builder.push(&slice); } - - builder.commit_row(); }, ), ); + + // This `range_partition_id(col, range_bounds)` function calculates the partition ID for each value + // in the column based on the specified partition boundaries. + // The column values are conceptually divided into multiple partitions defined by the range_bounds. + // For example, given the column values (0, 1, 3, 6, 8) and a partition configuration with 3 partitions, + // the range_bounds might be [1, 6]. The function would then return partition IDs as (0, 0, 1, 1, 2). 
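The registration that follows implements this lookup with a lower-bound binary search over the `range_bounds` array. Below is a standalone sketch of the same search, reproducing the worked example from the comments above (values `(0, 1, 3, 6, 8)` with bounds `[1, 6]` yield partition ids `(0, 0, 1, 1, 2)`); it illustrates the lookup rule only and is not the registered scalar function itself.

```rust
/// Lower-bound search: the partition id is the index of the first bound >= val,
/// or bounds.len() when every bound is smaller than val.
fn range_partition_id(val: i64, bounds: &[i64]) -> u64 {
    let (mut low, mut high) = (0, bounds.len());
    while low < high {
        let mid = low + (high - low) / 2;
        if val > bounds[mid] {
            low = mid + 1;
        } else {
            high = mid;
        }
    }
    low as u64
}

fn main() {
    // Bounds as produced by e.g. range_bound(3)(col) in the doc comment above.
    let bounds = [1, 6];
    let ids: Vec<u64> = [0, 1, 3, 6, 8]
        .iter()
        .map(|v| range_partition_id(*v, &bounds))
        .collect();
    assert_eq!(ids, vec![0u64, 0, 1, 1, 2]);
}
```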
+ registry.register_passthrough_nullable_2_arg::, ArrayType>, NumberType, _, _>( + "range_partition_id", + |_, _, _| FunctionDomain::Full, + vectorize_with_builder_2_arg::, ArrayType>, NumberType>(|val, arr, builder, _| { + let mut low = 0; + let mut high = arr.len(); + while low < high { + let mid = low + ((high - low) / 2); + let bound = unsafe {arr.index_unchecked(mid)}; + if val > bound { + low = mid + 1; + } else { + high = mid; + } + } + builder.push(low as u64); + }), + ); } diff --git a/src/query/functions/tests/it/scalars/testdata/function_list.txt b/src/query/functions/tests/it/scalars/testdata/function_list.txt index f18d7486df983..a7ebd51716226 100644 --- a/src/query/functions/tests/it/scalars/testdata/function_list.txt +++ b/src/query/functions/tests/it/scalars/testdata/function_list.txt @@ -1942,8 +1942,8 @@ Functions overloads: 1 h3_unidirectional_edge_is_valid(UInt64 NULL) :: Boolean NULL 0 haversine(Float64, Float64, Float64, Float64) :: Float64 1 haversine(Float64 NULL, Float64 NULL, Float64 NULL, Float64 NULL) :: Float64 NULL -0 hilbert_index(Array(Binary), UInt64) :: Binary -1 hilbert_index(Array(Binary) NULL, UInt64 NULL) :: Binary NULL +0 hilbert_index(Array(Binary NULL), UInt64) :: Binary NULL +1 hilbert_index(Array(Binary NULL) NULL, UInt64 NULL) :: Binary NULL 0 hilbert_key(String) :: Binary 1 hilbert_key(String NULL) :: Binary NULL 2 hilbert_key(UInt8) :: Binary @@ -3204,6 +3204,8 @@ Functions overloads: 2 rand(UInt64 NULL) :: Float64 NULL 0 range(UInt64, UInt64) :: Array(UInt64) 1 range(UInt64 NULL, UInt64 NULL) :: Array(UInt64) NULL +0 range_partition_id(T0, Array(T0)) :: UInt64 +1 range_partition_id(T0 NULL, Array(T0) NULL) :: UInt64 NULL 0 regexp(String, String) :: Boolean 1 regexp(String NULL, String NULL) :: Boolean NULL 0 regexp_instr FACTORY diff --git a/src/query/pipeline/transforms/src/processors/transforms/transform_compact_no_split_builder.rs b/src/query/pipeline/transforms/src/processors/transforms/transform_compact_no_split_builder.rs index 13a8786660c25..85215b0b58b6f 100644 --- a/src/query/pipeline/transforms/src/processors/transforms/transform_compact_no_split_builder.rs +++ b/src/query/pipeline/transforms/src/processors/transforms/transform_compact_no_split_builder.rs @@ -27,7 +27,7 @@ pub fn build_compact_block_no_split_pipeline( thresholds: BlockThresholds, max_threads: usize, ) -> Result<()> { - // has been resize 1. 
+ pipeline.try_resize(1)?; pipeline.add_accumulating_transformer(|| BlockCompactNoSplitBuilder::new(thresholds)); pipeline.try_resize(max_threads)?; pipeline.add_block_meta_transformer(TransformCompactBlock::default); diff --git a/src/query/service/src/interpreters/hook/compact_hook.rs b/src/query/service/src/interpreters/hook/compact_hook.rs index 61e1a7c5bcaaf..3c695cf3465e9 100644 --- a/src/query/service/src/interpreters/hook/compact_hook.rs +++ b/src/query/service/src/interpreters/hook/compact_hook.rs @@ -27,6 +27,7 @@ use databend_common_sql::optimizer::SExpr; use databend_common_sql::plans::OptimizeCompactBlock; use databend_common_sql::plans::Recluster; use databend_common_sql::plans::RelOperator; +use databend_storages_common_table_meta::table::ClusterType; use log::info; use crate::interpreters::common::metrics_inc_compact_hook_compact_time_ms; @@ -185,7 +186,7 @@ async fn compact_table( PipelineCompleteExecutor::from_pipelines(pipelines, executor_settings)?; // Clears previously generated segment locations to avoid duplicate data in the refresh phase - ctx.clear_segment_locations()?; + ctx.clear_written_segment_locations()?; ctx.set_executor(complete_executor.get_inner())?; complete_executor.execute()?; drop(complete_executor); @@ -194,21 +195,34 @@ async fn compact_table( { // do recluster. - if table.cluster_key_meta().is_some() { - let recluster = RelOperator::Recluster(Recluster { - catalog: compact_target.catalog, - database: compact_target.database, - table: compact_target.table, - filters: None, - limit: Some(settings.get_auto_compaction_segments_limit()? as usize), - }); - let s_expr = SExpr::create_leaf(Arc::new(recluster)); - let recluster_interpreter = - ReclusterTableInterpreter::try_create(ctx.clone(), s_expr, lock_opt, false)?; - // Recluster will be done in `ReclusterTableInterpreter::execute2` directly, - // we do not need to use `PipelineCompleteExecutor` to execute it. - let build_res = recluster_interpreter.execute2().await?; - assert!(build_res.main_pipeline.is_empty()); + if let Some(cluster_type) = table.cluster_type() { + if cluster_type == ClusterType::Linear { + // evict the table from cache + ctx.evict_table_from_cache( + &compact_target.catalog, + &compact_target.database, + &compact_target.table, + )?; + let recluster = RelOperator::Recluster(Recluster { + catalog: compact_target.catalog, + database: compact_target.database, + table: compact_target.table, + limit: Some(settings.get_auto_compaction_segments_limit()? as usize), + filters: None, + }); + let s_expr = SExpr::create_leaf(Arc::new(recluster)); + let recluster_interpreter = ReclusterTableInterpreter::try_create( + ctx.clone(), + s_expr, + None, + lock_opt, + false, + )?; + // Recluster will be done in `ReclusterTableInterpreter::execute2` directly, + // we do not need to use `PipelineCompleteExecutor` to execute it. 
+ let build_res = recluster_interpreter.execute2().await?; + debug_assert!(build_res.main_pipeline.is_empty()); + } } } diff --git a/src/query/service/src/interpreters/hook/refresh_hook.rs b/src/query/service/src/interpreters/hook/refresh_hook.rs index ecdcbab1e9fbf..52a775668244f 100644 --- a/src/query/service/src/interpreters/hook/refresh_hook.rs +++ b/src/query/service/src/interpreters/hook/refresh_hook.rs @@ -209,7 +209,7 @@ async fn generate_refresh_index_plan( catalog: &str, table_id: MetaId, ) -> Result> { - let segment_locs = ctx.get_segment_locations()?; + let segment_locs = ctx.get_written_segment_locations()?; let catalog = ctx.get_catalog(catalog).await?; let mut plans = vec![]; let indexes = catalog @@ -272,7 +272,7 @@ async fn generate_refresh_inverted_index_plan( desc: &RefreshDesc, table: Arc, ) -> Result> { - let segment_locs = ctx.get_segment_locations()?; + let segment_locs = ctx.get_written_segment_locations()?; let mut plans = vec![]; let table_meta = &table.get_table_info().meta; @@ -296,7 +296,7 @@ async fn generate_refresh_virtual_column_plan( ctx: Arc, desc: &RefreshDesc, ) -> Result> { - let segment_locs = ctx.get_segment_locations()?; + let segment_locs = ctx.get_written_segment_locations()?; let table_info = ctx .get_table(&desc.catalog, &desc.database, &desc.table) diff --git a/src/query/service/src/interpreters/interpreter.rs b/src/query/service/src/interpreters/interpreter.rs index 3948cd47f256e..fdc9e32217728 100644 --- a/src/query/service/src/interpreters/interpreter.rs +++ b/src/query/service/src/interpreters/interpreter.rs @@ -240,7 +240,7 @@ async fn plan_sql( let extras = planner.parse_sql(sql)?; if !acquire_queue { // If queue guard is not required, plan the statement directly. - let plan = planner.plan_stmt(&extras.statement).await?; + let plan = planner.plan_stmt(&extras.statement, true).await?; return Ok((plan, extras, AcquireQueueGuard::create(None))); } @@ -251,11 +251,11 @@ async fn plan_sql( // See PR https://github.com/databendlabs/databend/pull/16632 let query_entry = QueryEntry::create_entry(&ctx, &extras, true)?; let guard = QueriesQueueManager::instance().acquire(query_entry).await?; - let plan = planner.plan_stmt(&extras.statement).await?; + let plan = planner.plan_stmt(&extras.statement, true).await?; Ok((plan, extras, guard)) } else { // No lock is needed, plan the statement first, then acquire the queue guard. 
- let plan = planner.plan_stmt(&extras.statement).await?; + let plan = planner.plan_stmt(&extras.statement, true).await?; let query_entry = QueryEntry::create(&ctx, &plan, &extras)?; let guard = QueriesQueueManager::instance().acquire(query_entry).await?; Ok((plan, extras, guard)) diff --git a/src/query/service/src/interpreters/interpreter_factory.rs b/src/query/service/src/interpreters/interpreter_factory.rs index 2dc366f621191..a2854fa28c208 100644 --- a/src/query/service/src/interpreters/interpreter_factory.rs +++ b/src/query/service/src/interpreters/interpreter_factory.rs @@ -339,14 +339,17 @@ impl InterpreterFactory { Plan::DropTableClusterKey(drop_table_cluster_key) => Ok(Arc::new( DropTableClusterKeyInterpreter::try_create(ctx, *drop_table_cluster_key.clone())?, )), - Plan::ReclusterTable { s_expr, is_final } => { - Ok(Arc::new(ReclusterTableInterpreter::try_create( - ctx, - *s_expr.clone(), - LockTableOption::LockWithRetry, - *is_final, - )?)) - } + Plan::ReclusterTable { + s_expr, + hilbert_query, + is_final, + } => Ok(Arc::new(ReclusterTableInterpreter::try_create( + ctx, + *s_expr.clone(), + hilbert_query.clone(), + LockTableOption::LockWithRetry, + *is_final, + )?)), Plan::TruncateTable(truncate_table) => Ok(Arc::new( TruncateTableInterpreter::try_create(ctx, *truncate_table.clone())?, )), diff --git a/src/query/service/src/interpreters/interpreter_replace.rs b/src/query/service/src/interpreters/interpreter_replace.rs index 65084b30ac970..18c1e6eed442b 100644 --- a/src/query/service/src/interpreters/interpreter_replace.rs +++ b/src/query/service/src/interpreters/interpreter_replace.rs @@ -47,6 +47,7 @@ use databend_common_storage::StageFileInfo; use databend_common_storages_factory::Table; use databend_common_storages_fuse::FuseTable; use databend_storages_common_table_meta::readers::snapshot_reader::TableSnapshotAccessor; +use databend_storages_common_table_meta::table::ClusterType; use parking_lot::RwLock; use crate::interpreters::common::check_deduplicate_label; @@ -290,7 +291,10 @@ impl ReplaceInterpreter { .ctx .get_settings() .get_replace_into_bloom_pruning_max_column_number()?; - let bloom_filter_column_indexes = if table.cluster_key_meta().is_some() { + let bloom_filter_column_indexes = if table + .cluster_type() + .is_some_and(|v| v == ClusterType::Linear) + { fuse_table .choose_bloom_filter_columns( self.ctx.clone(), diff --git a/src/query/service/src/interpreters/interpreter_table_recluster.rs b/src/query/service/src/interpreters/interpreter_table_recluster.rs index ffb4329203726..9c9f08633d285 100644 --- a/src/query/service/src/interpreters/interpreter_table_recluster.rs +++ b/src/query/service/src/interpreters/interpreter_table_recluster.rs @@ -17,16 +17,23 @@ use std::sync::Arc; use std::time::Duration; use std::time::SystemTime; +use databend_common_ast::ast::Query; +use databend_common_ast::ast::Statement; use databend_common_catalog::lock::LockTableOption; use databend_common_exception::ErrorCode; use databend_common_exception::Result; use databend_common_sql::executor::PhysicalPlanBuilder; use databend_common_sql::optimizer::SExpr; +use databend_common_sql::plans::set_update_stream_columns; +use databend_common_sql::plans::Plan; use databend_common_sql::plans::Recluster; use databend_common_sql::MetadataRef; +use databend_common_sql::Planner; use log::error; use log::warn; +use crate::interpreters::hook::vacuum_hook::hook_disk_temp_dir; +use crate::interpreters::hook::vacuum_hook::hook_vacuum_temp_files; use crate::interpreters::Interpreter; use 
crate::interpreters::InterpreterClusteringHistory; use crate::pipelines::executor::ExecutorSettings; @@ -39,6 +46,7 @@ use crate::sessions::TableContext; pub struct ReclusterTableInterpreter { ctx: Arc, s_expr: SExpr, + hilbert_query: Option>, lock_opt: LockTableOption, is_final: bool, } @@ -47,12 +55,14 @@ impl ReclusterTableInterpreter { pub fn try_create( ctx: Arc, s_expr: SExpr, + hilbert_query: Option>, lock_opt: LockTableOption, is_final: bool, ) -> Result { Ok(Self { ctx, s_expr, + hilbert_query, lock_opt, is_final, }) @@ -77,6 +87,7 @@ impl Interpreter for ReclusterTableInterpreter { let mut times = 0; let start = SystemTime::now(); let timeout = Duration::from_secs(recluster_timeout_secs); + let plan: Recluster = self.s_expr.plan().clone().try_into()?; loop { if let Err(err) = ctx.check_aborting() { error!( @@ -85,7 +96,7 @@ impl Interpreter for ReclusterTableInterpreter { return Err(err.with_context("failed to execute")); } - let res = self.execute_recluster().await; + let res = self.execute_recluster(plan.clone()).await; match res { Ok(is_break) => { @@ -132,6 +143,10 @@ impl Interpreter for ReclusterTableInterpreter { ); break; } + + self.ctx.clear_selected_segment_locations(); + self.ctx + .evict_table_from_cache(&plan.catalog, &plan.database, &plan.table)?; } Ok(PipelineBuildResult::create()) @@ -139,19 +154,45 @@ impl Interpreter for ReclusterTableInterpreter { } impl ReclusterTableInterpreter { - async fn execute_recluster(&self) -> Result { + async fn execute_recluster(&self, op: Recluster) -> Result { let start = SystemTime::now(); - let plan: Recluster = self.s_expr.plan().clone().try_into()?; - // try add lock table. + // try to add lock table. let lock_guard = self .ctx .clone() - .acquire_table_lock(&plan.catalog, &plan.database, &plan.table, &self.lock_opt) + .acquire_table_lock(&op.catalog, &op.database, &op.table, &self.lock_opt) .await?; - let mut builder = PhysicalPlanBuilder::new(MetadataRef::default(), self.ctx.clone(), false); - let physical_plan = match builder.build(&self.s_expr, HashSet::new()).await { + let tbl = self + .ctx + .get_table(&op.catalog, &op.database, &op.table) + .await?; + let (s_expr, metadata, required) = if let Some(hilbert) = &self.hilbert_query { + let mut planner = Planner::new(self.ctx.clone()); + let plan = planner + .plan_stmt(&Statement::Query(hilbert.clone()), false) + .await?; + let Plan::Query { + mut s_expr, + metadata, + bind_context, + .. + } = plan + else { + unreachable!() + }; + if tbl.change_tracking_enabled() { + *s_expr = set_update_stream_columns(&s_expr)?; + } + let s_expr = self.s_expr.replace_children(vec![Arc::new(*s_expr)]); + (s_expr, metadata, bind_context.column_set()) + } else { + (self.s_expr.clone(), MetadataRef::default(), HashSet::new()) + }; + + let mut builder = PhysicalPlanBuilder::new(metadata, self.ctx.clone(), false); + let physical_plan = match builder.build(&s_expr, required).await { Ok(res) => res, Err(e) => { return if e.code() == ErrorCode::NO_NEED_TO_RECLUSTER { @@ -164,7 +205,7 @@ impl ReclusterTableInterpreter { let mut build_res = build_query_pipeline_without_render_result_set(&self.ctx, &physical_plan).await?; - assert!(build_res.main_pipeline.is_complete_pipeline()?); + debug_assert!(build_res.main_pipeline.is_complete_pipeline()?); let max_threads = self.ctx.get_settings().get_max_threads()? 
as usize; build_res.set_max_threads(max_threads); @@ -176,7 +217,7 @@ impl ReclusterTableInterpreter { let complete_executor = PipelineCompleteExecutor::from_pipelines(pipelines, executor_settings)?; - self.ctx.clear_segment_locations()?; + self.ctx.clear_written_segment_locations()?; self.ctx.set_executor(complete_executor.get_inner())?; complete_executor.execute()?; // make sure the executor is dropped before the next loop. @@ -184,7 +225,11 @@ impl ReclusterTableInterpreter { // make sure the lock guard is dropped before the next loop. drop(lock_guard); - InterpreterClusteringHistory::write_log(&self.ctx, start, &plan.database, &plan.table)?; + // vacuum temp files. + hook_vacuum_temp_files(&self.ctx)?; + hook_disk_temp_dir(&self.ctx)?; + + InterpreterClusteringHistory::write_log(&self.ctx, start, &op.database, &op.table)?; Ok(false) } } diff --git a/src/query/service/src/pipelines/builders/builder_column_mutation.rs b/src/query/service/src/pipelines/builders/builder_column_mutation.rs index 225fef28c1380..1e5ea0acdead0 100644 --- a/src/query/service/src/pipelines/builders/builder_column_mutation.rs +++ b/src/query/service/src/pipelines/builders/builder_column_mutation.rs @@ -19,7 +19,6 @@ use databend_common_exception::Result; use databend_common_expression::RemoteExpr; use databend_common_functions::BUILTIN_FUNCTIONS; use databend_common_pipeline_transforms::processors::TransformPipelineHelper; -use databend_common_sql::binder::MutationType; use databend_common_sql::evaluator::BlockOperator; use databend_common_sql::evaluator::CompoundBlockOperator; use databend_common_sql::executor::physical_plans::ColumnMutation; @@ -47,45 +46,28 @@ impl PipelineBuilder { .build_table_by_table_info(&column_mutation.table_info, None)?; let table = FuseTable::try_from_table(table.as_ref())?; - if column_mutation.mutation_type == MutationType::Delete { - let cluster_stats_gen = table.get_cluster_stats_gen( - self.ctx.clone(), - 0, - table.get_block_thresholds(), - None, - )?; - self.main_pipeline.add_transform(|input, output| { - let proc = TransformSerializeBlock::try_create( - self.ctx.clone(), - input, - output, - table, - cluster_stats_gen.clone(), - MutationKind::Delete, - )?; - proc.into_processor() - })?; + let block_thresholds = table.get_block_thresholds(); + let cluster_stats_gen = if matches!(column_mutation.mutation_kind, MutationKind::Delete) { + table.get_cluster_stats_gen(self.ctx.clone(), 0, block_thresholds, None)? } else { - let block_thresholds = table.get_block_thresholds(); - let cluster_stats_gen = table.cluster_gen_for_append( + table.cluster_gen_for_append( self.ctx.clone(), &mut self.main_pipeline, block_thresholds, None, + )? 
+ }; + self.main_pipeline.add_transform(|input, output| { + let proc = TransformSerializeBlock::try_create( + self.ctx.clone(), + input, + output, + table, + cluster_stats_gen.clone(), + column_mutation.mutation_kind, )?; - self.main_pipeline.add_transform(|input, output| { - let proc = TransformSerializeBlock::try_create( - self.ctx.clone(), - input, - output, - table, - cluster_stats_gen.clone(), - MutationKind::Update, - )?; - proc.into_processor() - })?; - } - + proc.into_processor() + })?; Ok(()) } diff --git a/src/query/service/src/pipelines/builders/builder_hilbert_serialize.rs b/src/query/service/src/pipelines/builders/builder_hilbert_serialize.rs new file mode 100644 index 0000000000000..d931544037aae --- /dev/null +++ b/src/query/service/src/pipelines/builders/builder_hilbert_serialize.rs @@ -0,0 +1,56 @@ +// Copyright 2021 Datafuse Labs +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +use databend_common_exception::Result; +use databend_common_pipeline_transforms::processors::build_compact_block_no_split_pipeline; +use databend_common_sql::executor::physical_plans::HilbertSerialize; +use databend_common_sql::executor::physical_plans::MutationKind; +use databend_common_storages_factory::Table; +use databend_common_storages_fuse::operations::TransformSerializeBlock; +use databend_common_storages_fuse::statistics::ClusterStatsGenerator; +use databend_common_storages_fuse::FuseTable; +use databend_common_storages_fuse::TableContext; + +use crate::pipelines::PipelineBuilder; + +impl PipelineBuilder { + pub(crate) fn build_hilbert_serialize(&mut self, serialize: &HilbertSerialize) -> Result<()> { + self.build_pipeline(&serialize.input)?; + let table = self + .ctx + .build_table_by_table_info(&serialize.table_info, None)?; + let table = FuseTable::try_from_table(table.as_ref())?; + + let block_thresholds = table.get_block_thresholds(); + let max_threads = self.ctx.get_settings().get_max_threads()? 
as usize; + build_compact_block_no_split_pipeline( + &mut self.main_pipeline, + block_thresholds, + max_threads, + )?; + + self.main_pipeline + .add_transform(|transform_input_port, transform_output_port| { + let proc = TransformSerializeBlock::try_create( + self.ctx.clone(), + transform_input_port, + transform_output_port, + table, + ClusterStatsGenerator::default(), + MutationKind::Recluster, + )?; + proc.into_processor() + }) + } +} diff --git a/src/query/service/src/pipelines/builders/builder_recluster.rs b/src/query/service/src/pipelines/builders/builder_recluster.rs index dfc414490f9bb..f57e149feab6b 100644 --- a/src/query/service/src/pipelines/builders/builder_recluster.rs +++ b/src/query/service/src/pipelines/builders/builder_recluster.rs @@ -40,6 +40,26 @@ use crate::pipelines::processors::TransformAddStreamColumns; use crate::pipelines::PipelineBuilder; impl PipelineBuilder { + /// The flow of Pipeline is as follows: + // ┌──────────┐ ┌───────────────┐ ┌─────────┐ + // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┐ + // └──────────┘ └───────────────┘ └─────────┘ │ + // ┌──────────┐ ┌───────────────┐ ┌─────────┐ │ ┌──────────────┐ ┌─────────┐ + // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┤────►│MultiSortMerge├────►│Resize(N)├───┐ + // └──────────┘ └───────────────┘ └─────────┘ │ └──────────────┘ └─────────┘ │ + // ┌──────────┐ ┌───────────────┐ ┌─────────┐ │ │ + // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┘ │ + // └──────────┘ └───────────────┘ └─────────┘ │ + // ┌──────────────────────────────────────────────────────────────────────────────────────────────┘ + // │ ┌──────────────┐ + // │ ┌───►│SerializeBlock├───┐ + // │ │ └──────────────┘ │ + // │ │ ┌──────────────┐ │ ┌─────────┐ ┌────────────────┐ ┌─────────────┐ ┌──────────┐ + // └───►│───►│SerializeBlock├───┤───►│Resize(1)├───►│SerializeSegment├────►│ReclusterAggr├────►│CommitSink│ + // │ └──────────────┘ │ └─────────┘ └────────────────┘ └─────────────┘ └──────────┘ + // │ ┌──────────────┐ │ + // └───►│SerializeBlock├───┘ + // └──────────────┘ pub(crate) fn build_recluster(&mut self, recluster: &Recluster) -> Result<()> { match recluster.tasks.len() { 0 => self.main_pipeline.add_source(EmptySource::create, 1), diff --git a/src/query/service/src/pipelines/builders/builder_replace_into.rs b/src/query/service/src/pipelines/builders/builder_replace_into.rs index ad3fd8854904c..e8e1f08d3228e 100644 --- a/src/query/service/src/pipelines/builders/builder_replace_into.rs +++ b/src/query/service/src/pipelines/builders/builder_replace_into.rs @@ -359,7 +359,7 @@ impl PipelineBuilder { } else { None }; - let cluster_keys = table.cluster_keys(self.ctx.clone()); + let cluster_keys = table.linear_cluster_keys(self.ctx.clone()); if *need_insert { let replace_into_processor = ReplaceIntoProcessor::create( self.ctx.clone(), diff --git a/src/query/service/src/pipelines/builders/mod.rs b/src/query/service/src/pipelines/builders/mod.rs index a35c735954af7..707ed7c7e4b58 100644 --- a/src/query/service/src/pipelines/builders/mod.rs +++ b/src/query/service/src/pipelines/builders/mod.rs @@ -25,6 +25,7 @@ mod builder_distributed_insert_select; mod builder_exchange; mod builder_fill_missing_columns; mod builder_filter; +mod builder_hilbert_serialize; mod builder_insert_multi_table; mod builder_join; mod builder_limit; diff --git a/src/query/service/src/pipelines/pipeline_builder.rs b/src/query/service/src/pipelines/pipeline_builder.rs index 8a87ce1e7eb7c..6508dcca83b6c 100644 --- 
a/src/query/service/src/pipelines/pipeline_builder.rs +++ b/src/query/service/src/pipelines/pipeline_builder.rs @@ -227,6 +227,7 @@ impl PipelineBuilder { // Recluster. PhysicalPlan::Recluster(recluster) => self.build_recluster(recluster), + PhysicalPlan::HilbertSerialize(serialize) => self.build_hilbert_serialize(serialize), PhysicalPlan::Duplicate(duplicate) => self.build_duplicate(duplicate), PhysicalPlan::Shuffle(shuffle) => self.build_shuffle(shuffle), diff --git a/src/query/service/src/pipelines/processors/transforms/transform_recursive_cte_source.rs b/src/query/service/src/pipelines/processors/transforms/transform_recursive_cte_source.rs index 4fd297786eae6..b8285d3061c24 100644 --- a/src/query/service/src/pipelines/processors/transforms/transform_recursive_cte_source.rs +++ b/src/query/service/src/pipelines/processors/transforms/transform_recursive_cte_source.rs @@ -339,6 +339,7 @@ async fn create_memory_table_for_cte_scan( | PhysicalPlan::CompactSource(_) | PhysicalPlan::CommitSink(_) | PhysicalPlan::Recluster(_) + | PhysicalPlan::HilbertSerialize(_) | PhysicalPlan::Duplicate(_) | PhysicalPlan::ChunkFilter(_) | PhysicalPlan::ChunkEvalScalar(_) diff --git a/src/query/service/src/sessions/query_ctx.rs b/src/query/service/src/sessions/query_ctx.rs index 0392c22f6336b..9c55fba8f5b37 100644 --- a/src/query/service/src/sessions/query_ctx.rs +++ b/src/query/service/src/sessions/query_ctx.rs @@ -152,7 +152,9 @@ pub struct QueryContext { query_settings: Arc, fragment_id: Arc, // Used by synchronized generate aggregating indexes when new data written. - inserted_segment_locs: Arc>>, + written_segment_locs: Arc>>, + // Used by Hilbert clustering when doing recluster. + selected_segment_locs: Arc>>, // Temp table for materialized CTE, first string is the database_name, second string is the table_name // All temp tables' catalog is `CATALOG_DEFAULT`, so we don't need to store it.
m_cte_temp_table: Arc>>, @@ -179,9 +181,10 @@ impl QueryContext { shared, query_settings, fragment_id: Arc::new(AtomicUsize::new(0)), - inserted_segment_locs: Arc::new(RwLock::new(HashSet::new())), - block_threshold: Arc::new(RwLock::new(BlockThresholds::default())), + written_segment_locs: Default::default(), + block_threshold: Default::default(), m_cte_temp_table: Default::default(), + selected_segment_locs: Default::default(), }) } @@ -1220,27 +1223,41 @@ impl TableContext for QueryContext { }) } - fn add_segment_location(&self, segment_loc: Location) -> Result<()> { - let mut segment_locations = self.inserted_segment_locs.write(); + fn add_written_segment_location(&self, segment_loc: Location) -> Result<()> { + let mut segment_locations = self.written_segment_locs.write(); segment_locations.insert(segment_loc); Ok(()) } - fn clear_segment_locations(&self) -> Result<()> { - let mut segment_locations = self.inserted_segment_locs.write(); + fn clear_written_segment_locations(&self) -> Result<()> { + let mut segment_locations = self.written_segment_locs.write(); segment_locations.clear(); Ok(()) } - fn get_segment_locations(&self) -> Result> { + fn get_written_segment_locations(&self) -> Result> { Ok(self - .inserted_segment_locs + .written_segment_locs .read() .iter() .cloned() .collect::>()) } + fn add_selected_segment_location(&self, segment_loc: Location) { + let mut segment_locations = self.selected_segment_locs.write(); + segment_locations.insert(segment_loc); + } + + fn get_selected_segment_locations(&self) -> Vec { + self.selected_segment_locs.read().iter().cloned().collect() + } + + fn clear_selected_segment_locations(&self) { + let mut segment_locations = self.selected_segment_locs.write(); + segment_locations.clear(); + } + fn add_file_status(&self, file_path: &str, file_status: FileStatus) -> Result<()> { if matches!(self.get_query_kind(), QueryKind::CopyIntoTable) { self.shared.copy_status.add_chunk(file_path, file_status); diff --git a/src/query/service/src/table_functions/table_function_factory.rs b/src/query/service/src/table_functions/table_function_factory.rs index 3a24d03099102..32b6615059eb8 100644 --- a/src/query/service/src/table_functions/table_function_factory.rs +++ b/src/query/service/src/table_functions/table_function_factory.rs @@ -27,6 +27,7 @@ use databend_common_storages_fuse::table_functions::FuseEncodingFunc; use databend_common_storages_fuse::table_functions::FuseStatisticsFunc; use databend_common_storages_fuse::table_functions::FuseTimeTravelSizeFunc; use databend_common_storages_fuse::table_functions::FuseVacuumTemporaryTable; +use databend_common_storages_fuse::table_functions::HilbertClusteringInfoFunc; use databend_common_storages_fuse::table_functions::SetCacheCapacity; use databend_common_storages_fuse::table_functions::TableFunctionTemplate; use databend_common_storages_stream::stream_status_table_func::StreamStatusTable; @@ -195,6 +196,14 @@ impl TableFunctionFactory { ), ); + creators.insert( + "hilbert_clustering_information".to_string(), + ( + next_id(), + Arc::new(TableFunctionTemplate::::create), + ), + ); + creators.insert( "fuse_vacuum_temporary_table".to_string(), ( diff --git a/src/query/service/tests/it/sql/exec/get_table_bind_test.rs b/src/query/service/tests/it/sql/exec/get_table_bind_test.rs index 95045562db4f8..228f0753b4378 100644 --- a/src/query/service/tests/it/sql/exec/get_table_bind_test.rs +++ b/src/query/service/tests/it/sql/exec/get_table_bind_test.rs @@ -845,15 +845,15 @@ impl TableContext for CtxDelegation { todo!() } - fn 
add_segment_location(&self, _segment_loc: Location) -> Result<()> { + fn add_written_segment_location(&self, _segment_loc: Location) -> Result<()> { todo!() } - fn clear_segment_locations(&self) -> Result<()> { + fn clear_written_segment_locations(&self) -> Result<()> { todo!() } - fn get_segment_locations(&self) -> Result> { + fn get_written_segment_locations(&self) -> Result> { todo!() } diff --git a/src/query/service/tests/it/storages/fuse/operations/commit.rs b/src/query/service/tests/it/storages/fuse/operations/commit.rs index 9c216a0016ac3..884615af0a3dd 100644 --- a/src/query/service/tests/it/storages/fuse/operations/commit.rs +++ b/src/query/service/tests/it/storages/fuse/operations/commit.rs @@ -730,15 +730,15 @@ impl TableContext for CtxDelegation { HashMap::new() } - fn add_segment_location(&self, _segment_loc: Location) -> Result<()> { + fn add_written_segment_location(&self, _segment_loc: Location) -> Result<()> { todo!() } - fn clear_segment_locations(&self) -> Result<()> { + fn clear_written_segment_locations(&self) -> Result<()> { todo!() } - fn get_segment_locations(&self) -> Result> { + fn get_written_segment_locations(&self) -> Result> { todo!() } diff --git a/src/query/settings/src/settings_default.rs b/src/query/settings/src/settings_default.rs index b8e51c9dd75f7..ea88aa5a1506a 100644 --- a/src/query/settings/src/settings_default.rs +++ b/src/query/settings/src/settings_default.rs @@ -1158,6 +1158,20 @@ impl DefaultSettings { scope: SettingScope::Session, range: None, }), + ("hilbert_num_range_ids", DefaultSettingValue { + value: UserSettingValue::UInt64(1024), + desc: "Specifies the domain of range IDs in Hilbert clustering. A larger value provides finer granularity, but may incur a performance cost.", + mode: SettingMode::Both, + scope: SettingScope::Both, + range: Some(SettingRange::Numeric(1..=65535)), + }), + ("hilbert_sample_size_per_block", DefaultSettingValue { + value: UserSettingValue::UInt64(1000), + desc: "Specifies the number of sample points per block used in Hilbert clustering.", + mode: SettingMode::Both, + scope: SettingScope::Both, + range: Some(SettingRange::Numeric(1..=u64::MAX)), + }), ]); Ok(Arc::new(DefaultSettings { diff --git a/src/query/settings/src/settings_getter_setter.rs b/src/query/settings/src/settings_getter_setter.rs index 803af09caf731..9b9608fcc79b3 100644 --- a/src/query/settings/src/settings_getter_setter.rs +++ b/src/query/settings/src/settings_getter_setter.rs @@ -181,6 +181,11 @@ impl Settings { self.try_get_u64("max_block_size") } + // Set max_block_size. 
+ pub fn set_max_block_size(&self, val: u64) -> Result<()> { + self.try_set_u64("max_block_size", val) + } + // Max block size for parquet reader pub fn get_parquet_max_block_size(&self) -> Result { self.try_get_u64("parquet_max_block_size") @@ -853,4 +858,12 @@ impl Settings { pub unsafe fn set_warehouse(&self, warehouse: String) -> Result<()> { self.unchecked_set_setting(String::from("warehouse"), warehouse) } + + pub fn get_hilbert_num_range_ids(&self) -> Result { + self.try_get_u64("hilbert_num_range_ids") + } + + pub fn get_hilbert_sample_size_per_block(&self) -> Result { + self.try_get_u64("hilbert_sample_size_per_block") + } } diff --git a/src/query/sql/Cargo.toml b/src/query/sql/Cargo.toml index ba707dc16a72b..0cdb7cf0e5a88 100644 --- a/src/query/sql/Cargo.toml +++ b/src/query/sql/Cargo.toml @@ -35,6 +35,7 @@ databend-common-storages-result-cache = { workspace = true } databend-common-storages-view = { workspace = true } databend-common-users = { workspace = true } databend-enterprise-data-mask-feature = { workspace = true } +databend-enterprise-hilbert-clustering = { workspace = true } databend-storages-common-cache = { workspace = true } databend-storages-common-io = { workspace = true } databend-storages-common-session = { workspace = true } diff --git a/src/query/sql/src/executor/format.rs b/src/query/sql/src/executor/format.rs index a671c196405ab..233c0c408340e 100644 --- a/src/query/sql/src/executor/format.rs +++ b/src/query/sql/src/executor/format.rs @@ -350,6 +350,9 @@ fn to_format_tree( distributed_insert_to_format_tree(plan.as_ref(), metadata, profs) } PhysicalPlan::Recluster(_) => Ok(FormatTreeNode::new("Recluster".to_string())), + PhysicalPlan::HilbertSerialize(_) => { + Ok(FormatTreeNode::new("HilbertSerialize".to_string())) + } PhysicalPlan::CompactSource(_) => Ok(FormatTreeNode::new("CompactSource".to_string())), PhysicalPlan::CommitSink(plan) => commit_sink_to_format_tree(plan, metadata, profs), PhysicalPlan::ProjectSet(plan) => project_set_to_format_tree(plan, metadata, profs), diff --git a/src/query/sql/src/executor/physical_plan.rs b/src/query/sql/src/executor/physical_plan.rs index 8888cfb8e9f92..292438a290e06 100644 --- a/src/query/sql/src/executor/physical_plan.rs +++ b/src/query/sql/src/executor/physical_plan.rs @@ -23,6 +23,7 @@ use enum_as_inner::EnumAsInner; use itertools::Itertools; use super::physical_plans::AddStreamColumn; +use super::physical_plans::HilbertSerialize; use super::physical_plans::MutationManipulate; use super::physical_plans::MutationOrganize; use super::physical_plans::MutationSource; @@ -131,6 +132,7 @@ pub enum PhysicalPlan { /// Recluster Recluster(Box), + HilbertSerialize(Box), /// Multi table insert Duplicate(Box), @@ -348,6 +350,10 @@ impl PhysicalPlan { plan.plan_id = *next_id; *next_id += 1; } + PhysicalPlan::HilbertSerialize(plan) => { + plan.plan_id = *next_id; + *next_id += 1; + } PhysicalPlan::Duplicate(plan) => { plan.plan_id = *next_id; *next_id += 1; @@ -438,6 +444,7 @@ impl PhysicalPlan { PhysicalPlan::ReplaceInto(v) => v.plan_id, PhysicalPlan::CompactSource(v) => v.plan_id, PhysicalPlan::Recluster(v) => v.plan_id, + PhysicalPlan::HilbertSerialize(v) => v.plan_id, PhysicalPlan::Duplicate(v) => v.plan_id, PhysicalPlan::Shuffle(v) => v.plan_id, PhysicalPlan::ChunkFilter(v) => v.plan_id, @@ -492,7 +499,8 @@ impl PhysicalPlan { | PhysicalPlan::CompactSource(_) | PhysicalPlan::CommitSink(_) | PhysicalPlan::DistributedInsertSelect(_) - | PhysicalPlan::Recluster(_) => Ok(DataSchemaRef::default()), + | PhysicalPlan::Recluster(_) 
+ | PhysicalPlan::HilbertSerialize(_) => Ok(DataSchemaRef::default()), PhysicalPlan::Duplicate(plan) => plan.input.output_schema(), PhysicalPlan::Shuffle(plan) => plan.input.output_schema(), PhysicalPlan::ChunkFilter(plan) => plan.input.output_schema(), @@ -552,6 +560,7 @@ impl PhysicalPlan { PhysicalPlan::ExpressionScan(_) => "ExpressionScan".to_string(), PhysicalPlan::CacheScan(_) => "CacheScan".to_string(), PhysicalPlan::Recluster(_) => "Recluster".to_string(), + PhysicalPlan::HilbertSerialize(_) => "HilbertSerialize".to_string(), PhysicalPlan::Udf(_) => "Udf".to_string(), PhysicalPlan::Duplicate(_) => "Duplicate".to_string(), PhysicalPlan::Shuffle(_) => "Shuffle".to_string(), @@ -574,6 +583,7 @@ impl PhysicalPlan { | PhysicalPlan::CompactSource(_) | PhysicalPlan::ReplaceAsyncSourcer(_) | PhysicalPlan::Recluster(_) + | PhysicalPlan::HilbertSerialize(_) | PhysicalPlan::RecursiveCteScan(_) => Box::new(std::iter::empty()), PhysicalPlan::Filter(plan) => Box::new(std::iter::once(plan.input.as_ref())), PhysicalPlan::EvalScalar(plan) => Box::new(std::iter::once(plan.input.as_ref())), @@ -679,6 +689,7 @@ impl PhysicalPlan { | PhysicalPlan::CacheScan(_) | PhysicalPlan::RecursiveCteScan(_) | PhysicalPlan::Recluster(_) + | PhysicalPlan::HilbertSerialize(_) | PhysicalPlan::Duplicate(_) | PhysicalPlan::Shuffle(_) | PhysicalPlan::ChunkFilter(_) diff --git a/src/query/sql/src/executor/physical_plan_builder.rs b/src/query/sql/src/executor/physical_plan_builder.rs index 1b28a32d5f87e..c020fdef52664 100644 --- a/src/query/sql/src/executor/physical_plan_builder.rs +++ b/src/query/sql/src/executor/physical_plan_builder.rs @@ -126,7 +126,9 @@ impl PhysicalPlanBuilder { RelOperator::MutationSource(mutation_source) => { self.build_mutation_source(mutation_source).await } - RelOperator::Recluster(recluster) => self.build_recluster(recluster).await, + RelOperator::Recluster(recluster) => { + self.build_recluster(s_expr, recluster, required).await + } RelOperator::CompactBlock(compact) => self.build_compact_block(compact).await, } } @@ -134,6 +136,10 @@ impl PhysicalPlanBuilder { pub fn set_mutation_build_info(&mut self, mutation_build_info: MutationBuildInfo) { self.mutation_build_info = Some(mutation_build_info); } + + pub fn set_metadata(&mut self, metadata: MetadataRef) { + self.metadata = metadata; + } } #[derive(Clone)] diff --git a/src/query/sql/src/executor/physical_plan_visitor.rs b/src/query/sql/src/executor/physical_plan_visitor.rs index 7f53a14b515fd..5cdccd69f9e91 100644 --- a/src/query/sql/src/executor/physical_plan_visitor.rs +++ b/src/query/sql/src/executor/physical_plan_visitor.rs @@ -17,6 +17,7 @@ use databend_common_exception::Result; use super::physical_plans::AddStreamColumn; use super::physical_plans::CacheScan; use super::physical_plans::ExpressionScan; +use super::physical_plans::HilbertSerialize; use super::physical_plans::MutationManipulate; use super::physical_plans::MutationOrganize; use super::physical_plans::MutationSplit; @@ -107,6 +108,7 @@ pub trait PhysicalPlanReplacer { PhysicalPlan::ExpressionScan(plan) => self.replace_expression_scan(plan), PhysicalPlan::CacheScan(plan) => self.replace_cache_scan(plan), PhysicalPlan::Recluster(plan) => self.replace_recluster(plan), + PhysicalPlan::HilbertSerialize(plan) => self.replace_hilbert_serialize(plan), PhysicalPlan::Udf(plan) => self.replace_udf(plan), PhysicalPlan::AsyncFunction(plan) => self.replace_async_function(plan), PhysicalPlan::Duplicate(plan) => self.replace_duplicate(plan), @@ -125,6 +127,10 @@ pub trait 
PhysicalPlanReplacer { Ok(PhysicalPlan::Recluster(Box::new(plan.clone()))) } + fn replace_hilbert_serialize(&mut self, plan: &HilbertSerialize) -> Result { + Ok(PhysicalPlan::HilbertSerialize(Box::new(plan.clone()))) + } + fn replace_table_scan(&mut self, plan: &TableScan) -> Result { Ok(PhysicalPlan::TableScan(plan.clone())) } @@ -639,6 +645,7 @@ impl PhysicalPlan { | PhysicalPlan::ExpressionScan(_) | PhysicalPlan::CacheScan(_) | PhysicalPlan::Recluster(_) + | PhysicalPlan::HilbertSerialize(_) | PhysicalPlan::ExchangeSource(_) | PhysicalPlan::CompactSource(_) | PhysicalPlan::MutationSource(_) => {} diff --git a/src/query/sql/src/executor/physical_plans/mod.rs b/src/query/sql/src/executor/physical_plans/mod.rs index 2bb277f10a73c..0caee74d6bec5 100644 --- a/src/query/sql/src/executor/physical_plans/mod.rs +++ b/src/query/sql/src/executor/physical_plans/mod.rs @@ -67,7 +67,6 @@ pub use physical_async_func::AsyncFunctionDesc; pub use physical_cache_scan::CacheScan; pub use physical_column_mutation::ColumnMutation; pub use physical_commit_sink::CommitSink; -pub use physical_commit_sink::ReclusterInfoSideCar; pub use physical_compact_source::CompactSource; pub use physical_constant_table_scan::ConstantTableScan; pub use physical_copy_into_location::CopyIntoLocation; @@ -91,6 +90,7 @@ pub use physical_mutation_source::*; pub use physical_project_set::ProjectSet; pub use physical_r_cte_scan::RecursiveCteScan; pub use physical_range_join::*; +pub use physical_recluster::HilbertSerialize; pub use physical_recluster::Recluster; pub use physical_refresh_index::RefreshIndex; pub use physical_replace_async_source::ReplaceAsyncSourcer; diff --git a/src/query/sql/src/executor/physical_plans/physical_column_mutation.rs b/src/query/sql/src/executor/physical_plans/physical_column_mutation.rs index b3e167a802dd1..68f50af6e3117 100644 --- a/src/query/sql/src/executor/physical_plans/physical_column_mutation.rs +++ b/src/query/sql/src/executor/physical_plans/physical_column_mutation.rs @@ -17,8 +17,8 @@ use std::collections::HashMap; use databend_common_expression::RemoteExpr; use databend_common_meta_app::schema::TableInfo; -use crate::binder::MutationType; use crate::executor::physical_plan::PhysicalPlan; +use crate::executor::physical_plans::MutationKind; #[derive(Clone, Debug, serde::Serialize, serde::Deserialize)] pub struct ColumnMutation { @@ -27,7 +27,7 @@ pub struct ColumnMutation { pub table_info: TableInfo, pub mutation_expr: Option>, pub computed_expr: Option>, - pub mutation_type: MutationType, + pub mutation_kind: MutationKind, pub field_id_to_schema_index: HashMap, pub input_num_columns: usize, pub has_filter_column: bool, diff --git a/src/query/sql/src/executor/physical_plans/physical_commit_sink.rs b/src/query/sql/src/executor/physical_plans/physical_commit_sink.rs index 33bd4f06f7ca5..572a4944b1d1e 100644 --- a/src/query/sql/src/executor/physical_plans/physical_commit_sink.rs +++ b/src/query/sql/src/executor/physical_plans/physical_commit_sink.rs @@ -14,10 +14,9 @@ use std::sync::Arc; +use databend_common_catalog::plan::ReclusterInfoSideCar; use databend_common_meta_app::schema::TableInfo; use databend_common_meta_app::schema::UpdateStreamMetaReq; -use databend_storages_common_table_meta::meta::BlockMeta; -use databend_storages_common_table_meta::meta::Statistics; use databend_storages_common_table_meta::meta::TableSnapshot; use crate::executor::physical_plans::common::MutationKind; @@ -39,11 +38,3 @@ pub struct CommitSink { // Used for recluster. 
pub recluster_info: Option, } - -// TODO refine this -#[derive(serde::Serialize, serde::Deserialize, Clone, Debug, Default)] -pub struct ReclusterInfoSideCar { - pub merged_blocks: Vec>, - pub removed_segment_indexes: Vec, - pub removed_statistics: Statistics, -} diff --git a/src/query/sql/src/executor/physical_plans/physical_mutation.rs b/src/query/sql/src/executor/physical_plans/physical_mutation.rs index df8573418c554..d928bb43fe724 100644 --- a/src/query/sql/src/executor/physical_plans/physical_mutation.rs +++ b/src/query/sql/src/executor/physical_plans/physical_mutation.rs @@ -186,7 +186,7 @@ impl PhysicalPlanBuilder { table_info: mutation_build_info.table_info.clone(), mutation_expr, computed_expr, - mutation_type: mutation_type.clone(), + mutation_kind, field_id_to_schema_index, input_num_columns: mutation_input_schema.fields().len(), has_filter_column: predicate_column_index.is_some(), diff --git a/src/query/sql/src/executor/physical_plans/physical_recluster.rs b/src/query/sql/src/executor/physical_plans/physical_recluster.rs index 6fdb94eb97c9d..a82d2882d2a03 100644 --- a/src/query/sql/src/executor/physical_plans/physical_recluster.rs +++ b/src/query/sql/src/executor/physical_plans/physical_recluster.rs @@ -14,14 +14,14 @@ use databend_common_catalog::plan::PartInfoType; use databend_common_catalog::plan::PushDownInfo; +use databend_common_catalog::plan::ReclusterInfoSideCar; use databend_common_catalog::plan::ReclusterParts; use databend_common_catalog::plan::ReclusterTask; -use databend_common_catalog::table::TableExt; use databend_common_exception::ErrorCode; use databend_common_exception::Result; use databend_common_meta_app::schema::TableInfo; +use databend_enterprise_hilbert_clustering::get_hilbert_clustering_handler; -use crate::executor::physical_plans::physical_commit_sink::ReclusterInfoSideCar; use crate::executor::physical_plans::CommitSink; use crate::executor::physical_plans::CompactSource; use crate::executor::physical_plans::Exchange; @@ -29,6 +29,8 @@ use crate::executor::physical_plans::FragmentKind; use crate::executor::physical_plans::MutationKind; use crate::executor::PhysicalPlan; use crate::executor::PhysicalPlanBuilder; +use crate::optimizer::SExpr; +use crate::ColumnSet; #[derive(Clone, Debug, serde::Serialize, serde::Deserialize)] pub struct Recluster { @@ -37,30 +39,19 @@ pub struct Recluster { pub table_info: TableInfo, } +#[derive(serde::Serialize, serde::Deserialize, Clone, Debug)] +pub struct HilbertSerialize { + pub plan_id: u32, + pub input: Box, + pub table_info: TableInfo, +} + impl PhysicalPlanBuilder { - /// The flow of Pipeline is as follows: - // ┌──────────┐ ┌───────────────┐ ┌─────────┐ - // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┐ - // └──────────┘ └───────────────┘ └─────────┘ │ - // ┌──────────┐ ┌───────────────┐ ┌─────────┐ │ ┌──────────────┐ ┌─────────┐ - // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┤────►│MultiSortMerge├────►│Resize(N)├───┐ - // └──────────┘ └───────────────┘ └─────────┘ │ └──────────────┘ └─────────┘ │ - // ┌──────────┐ ┌───────────────┐ ┌─────────┐ │ │ - // │FuseSource├────►│CompoundBlockOp├────►│SortMerge├────┘ │ - // └──────────┘ └───────────────┘ └─────────┘ │ - // ┌──────────────────────────────────────────────────────────────────────────────────────────────┘ - // │ ┌──────────────┐ - // │ ┌───►│SerializeBlock├───┐ - // │ │ └──────────────┘ │ - // │ │ ┌──────────────┐ │ ┌─────────┐ ┌────────────────┐ ┌─────────────┐ ┌──────────┐ - // 
└───►│───►│SerializeBlock├───┤───►│Resize(1)├───►│SerializeSegment├────►│ReclusterAggr├────►│CommitSink│ - // │ └──────────────┘ │ └─────────┘ └────────────────┘ └─────────────┘ └──────────┘ - // │ ┌──────────────┐ │ - // └───►│SerializeBlock├───┘ - // └──────────────┘ pub async fn build_recluster( &mut self, + s_expr: &SExpr, recluster: &crate::plans::Recluster, + required: ColumnSet, ) -> Result { let crate::plans::Recluster { catalog, @@ -70,100 +61,127 @@ impl PhysicalPlanBuilder { limit, } = recluster; - let tenant = self.ctx.get_tenant(); - let catalog = self.ctx.get_catalog(catalog).await?; - let tbl = catalog.get_table(&tenant, database, table).await?; - // check mutability - tbl.check_mutable()?; - + let tbl = self.ctx.get_table(catalog, database, table).await?; let push_downs = filters.clone().map(|v| PushDownInfo { filters: Some(v), ..PushDownInfo::default() }); - let Some((parts, snapshot)) = tbl.recluster(self.ctx.clone(), push_downs, *limit).await? - else { - return Err(ErrorCode::NoNeedToRecluster(format!( - "No need to do recluster for '{database}'.'{table}'" - ))); - }; - if parts.is_empty() { - return Err(ErrorCode::NoNeedToRecluster(format!( - "No need to do recluster for '{database}'.'{table}'" - ))); - } - - let is_distributed = parts.is_distributed(self.ctx.clone()); let table_info = tbl.get_table_info().clone(); - let mut plan = match parts { - ReclusterParts::Recluster { - tasks, - remained_blocks, - removed_segment_indexes, - removed_segment_summary, - } => { - let mut root = PhysicalPlan::Recluster(Box::new(Recluster { + let is_hilbert = !s_expr.children.is_empty(); + let mut plan = if is_hilbert { + let handler = get_hilbert_clustering_handler(); + let Some((recluster_info, snapshot)) = handler + .do_hilbert_clustering(tbl.clone(), self.ctx.clone(), push_downs) + .await? + else { + return Err(ErrorCode::NoNeedToRecluster(format!( + "No need to do recluster for '{database}'.'{table}'" + ))); + }; + + let plan = self.build(s_expr.child(0)?, required).await?; + let plan = PhysicalPlan::HilbertSerialize(Box::new(HilbertSerialize { + plan_id: 0, + input: Box::new(plan), + table_info: table_info.clone(), + })); + PhysicalPlan::CommitSink(Box::new(CommitSink { + input: Box::new(plan), + table_info, + snapshot: Some(snapshot), + mutation_kind: MutationKind::Recluster, + update_stream_meta: vec![], + merge_meta: false, + deduplicated_label: None, + plan_id: u32::MAX, + recluster_info: Some(recluster_info), + })) + } else { + let Some((parts, snapshot)) = + tbl.recluster(self.ctx.clone(), push_downs, *limit).await? 
+ else { + return Err(ErrorCode::NoNeedToRecluster(format!( + "No need to do recluster for '{database}'.'{table}'" + ))); + }; + if parts.is_empty() { + return Err(ErrorCode::NoNeedToRecluster(format!( + "No need to do recluster for '{database}'.'{table}'" + ))); + } + + let is_distributed = parts.is_distributed(self.ctx.clone()); + match parts { + ReclusterParts::Recluster { tasks, - table_info: table_info.clone(), - plan_id: u32::MAX, - })); + remained_blocks, + removed_segment_indexes, + removed_segment_summary, + } => { + let mut root = PhysicalPlan::Recluster(Box::new(Recluster { + tasks, + table_info: table_info.clone(), + plan_id: u32::MAX, + })); - if is_distributed { - root = PhysicalPlan::Exchange(Exchange { - plan_id: 0, + if is_distributed { + root = PhysicalPlan::Exchange(Exchange { + plan_id: 0, + input: Box::new(root), + kind: FragmentKind::Merge, + keys: vec![], + allow_adjust_parallelism: true, + ignore_exchange: false, + }); + } + PhysicalPlan::CommitSink(Box::new(CommitSink { input: Box::new(root), - kind: FragmentKind::Merge, - keys: vec![], - allow_adjust_parallelism: true, - ignore_exchange: false, - }); + table_info, + snapshot: Some(snapshot), + mutation_kind: MutationKind::Recluster, + update_stream_meta: vec![], + merge_meta: false, + deduplicated_label: None, + plan_id: u32::MAX, + recluster_info: Some(ReclusterInfoSideCar { + merged_blocks: remained_blocks, + removed_segment_indexes, + removed_statistics: removed_segment_summary, + }), + })) } - PhysicalPlan::CommitSink(Box::new(CommitSink { - input: Box::new(root), - table_info, - snapshot: Some(snapshot), - mutation_kind: MutationKind::Recluster, - update_stream_meta: vec![], - merge_meta: false, - deduplicated_label: None, - plan_id: u32::MAX, - recluster_info: Some(ReclusterInfoSideCar { - merged_blocks: remained_blocks, - removed_segment_indexes, - removed_statistics: removed_segment_summary, - }), - })) - } - ReclusterParts::Compact(parts) => { - let merge_meta = parts.partitions_type() == PartInfoType::LazyLevel; - let mut root = PhysicalPlan::CompactSource(Box::new(CompactSource { - parts, - table_info: table_info.clone(), - column_ids: snapshot.schema.to_leaf_column_id_set(), - plan_id: u32::MAX, - })); + ReclusterParts::Compact(parts) => { + let merge_meta = parts.partitions_type() == PartInfoType::LazyLevel; + let mut root = PhysicalPlan::CompactSource(Box::new(CompactSource { + parts, + table_info: table_info.clone(), + column_ids: snapshot.schema.to_leaf_column_id_set(), + plan_id: u32::MAX, + })); + + if is_distributed { + root = PhysicalPlan::Exchange(Exchange { + plan_id: 0, + input: Box::new(root), + kind: FragmentKind::Merge, + keys: vec![], + allow_adjust_parallelism: true, + ignore_exchange: false, + }); + } - if is_distributed { - root = PhysicalPlan::Exchange(Exchange { - plan_id: 0, + PhysicalPlan::CommitSink(Box::new(CommitSink { input: Box::new(root), - kind: FragmentKind::Merge, - keys: vec![], - allow_adjust_parallelism: true, - ignore_exchange: false, - }); + table_info, + snapshot: Some(snapshot), + mutation_kind: MutationKind::Compact, + update_stream_meta: vec![], + merge_meta, + deduplicated_label: None, + plan_id: u32::MAX, + recluster_info: None, + })) } - - PhysicalPlan::CommitSink(Box::new(CommitSink { - input: Box::new(root), - table_info, - snapshot: Some(snapshot), - mutation_kind: MutationKind::Compact, - update_stream_meta: vec![], - merge_meta, - deduplicated_label: None, - plan_id: u32::MAX, - recluster_info: None, - })) } }; plan.adjust_plan_id(&mut 0); diff --git 
a/src/query/sql/src/planner/binder/ddl/table.rs b/src/query/sql/src/planner/binder/ddl/table.rs index bccfe999c0bcd..219247b538dc8 100644 --- a/src/query/sql/src/planner/binder/ddl/table.rs +++ b/src/query/sql/src/planner/binder/ddl/table.rs @@ -22,7 +22,7 @@ use databend_common_ast::ast::AlterTableStmt; use databend_common_ast::ast::AnalyzeTableStmt; use databend_common_ast::ast::AttachTableStmt; use databend_common_ast::ast::ClusterOption; -use databend_common_ast::ast::ClusterType; +use databend_common_ast::ast::ClusterType as AstClusterType; use databend_common_ast::ast::ColumnDefinition; use databend_common_ast::ast::ColumnExpr; use databend_common_ast::ast::CompactTarget; @@ -32,6 +32,7 @@ use databend_common_ast::ast::DescribeTableStmt; use databend_common_ast::ast::DropTableStmt; use databend_common_ast::ast::Engine; use databend_common_ast::ast::ExistsTableStmt; +use databend_common_ast::ast::Expr; use databend_common_ast::ast::Identifier; use databend_common_ast::ast::InvertedIndexDefinition; use databend_common_ast::ast::ModifyColumnAction; @@ -62,6 +63,7 @@ use databend_common_base::runtime::TrySpawn; use databend_common_catalog::lock::LockTableOption; use databend_common_catalog::plan::Filters; use databend_common_catalog::table::CompactionLimits; +use databend_common_catalog::table::TableExt; use databend_common_config::GlobalConfig; use databend_common_exception::ErrorCode; use databend_common_exception::Result; @@ -78,6 +80,8 @@ use databend_common_expression::TableSchema; use databend_common_expression::TableSchemaRef; use databend_common_expression::TableSchemaRefExt; use databend_common_functions::BUILTIN_FUNCTIONS; +use databend_common_license::license::Feature; +use databend_common_license::license_manager::LicenseManagerSwitch; use databend_common_meta_app::schema::CreateOption; use databend_common_meta_app::schema::TableIndex; use databend_common_meta_app::storage::StorageParams; @@ -86,6 +90,7 @@ use databend_common_storage::init_operator; use databend_common_storages_view::view_table::QUERY; use databend_common_storages_view::view_table::VIEW_ENGINE; use databend_storages_common_table_meta::table::is_reserved_opt_key; +use databend_storages_common_table_meta::table::ClusterType; use databend_storages_common_table_meta::table::OPT_KEY_CLUSTER_TYPE; use databend_storages_common_table_meta::table::OPT_KEY_DATABASE_ID; use databend_storages_common_table_meta::table::OPT_KEY_ENGINE_META; @@ -98,6 +103,7 @@ use derive_visitor::DriveMut; use log::debug; use opendal::Operator; +use crate::bind_table; use crate::binder::get_storage_params_from_options; use crate::binder::parse_storage_params_from_uri; use crate::binder::scalar::ScalarBinder; @@ -145,8 +151,10 @@ use crate::plans::VacuumTableOption; use crate::plans::VacuumTablePlan; use crate::plans::VacuumTemporaryFilesPlan; use crate::BindContext; +use crate::NameResolutionContext; use crate::Planner; use crate::SelectBuilder; +use crate::TypeChecker; impl Binder { #[async_backtrace::framed] @@ -469,7 +477,7 @@ impl Binder { Some(self.ctx.as_ref()), "when create TABLE with external location", ) - .await?; + .await?; // create a temporary op to check if params is correct let op = init_operator(&sp)?; @@ -1023,50 +1031,15 @@ impl Binder { selection, limit, } => { - let filters = if let Some(expr) = selection { - let (_, mut context) = - self.bind_table_reference(bind_context, table_reference)?; - - let mut scalar_binder = ScalarBinder::new( - &mut context, - self.ctx.clone(), - &self.name_resolution_ctx, - 
self.metadata.clone(), - &[], - ); - scalar_binder.forbid_udf(); - let (scalar, _) = scalar_binder.bind(expr)?; - - // prepare the filter expression - let filter = cast_expr_to_non_null_boolean( - scalar - .as_expr()? - .project_column_ref(|col| col.column_name.clone()), - )?; - // prepare the inverse filter expression - let inverted_filter = - check_function(None, "not", &[], &[filter.clone()], &BUILTIN_FUNCTIONS)?; - - Some(Filters { - filter: filter.as_remote_expr(), - inverted_filter: inverted_filter.as_remote_expr(), - }) - } else { - None - }; - - let recluster = RelOperator::Recluster(Recluster { + self.bind_recluster_table( catalog, database, table, - filters, - limit: limit.map(|v| v as usize), - }); - let s_expr = SExpr::create_leaf(Arc::new(recluster)); - Ok(Plan::ReclusterTable { - s_expr: Box::new(s_expr), - is_final: *is_final, - }) + limit.map(|v| v as usize), + selection, + *is_final, + ) + .await } AlterTableAction::FlashbackTo { point } => { let point = self.resolve_data_travel_point(bind_context, point)?; @@ -1097,6 +1070,150 @@ impl Binder { } } + #[async_backtrace::framed] + pub async fn bind_recluster_table( + &mut self, + catalog: String, + database: String, + table: String, + limit: Option, + selection: &Option, + is_final: bool, + ) -> Result { + let tbl = self.ctx.get_table(&catalog, &database, &table).await?; + // check mutability + tbl.check_mutable()?; + let Some(cluster_type) = tbl.cluster_type() else { + return Err(ErrorCode::UnclusteredTable(format!( + "Unclustered table '{}.{}'", + database, table, + ))); + }; + + let filters = if let Some(expr) = selection { + let (mut context, metadata) = bind_table(tbl.clone())?; + let mut type_checker = TypeChecker::try_create( + &mut context, + self.ctx.clone(), + &self.name_resolution_ctx, + metadata, + &[], + true, + )?; + let (scalar, _) = *type_checker.resolve(expr)?; + + // prepare the filter expression + let filter = cast_expr_to_non_null_boolean( + scalar + .as_expr()? 
+ .project_column_ref(|col| col.column_name.clone()), + )?; + // prepare the inverse filter expression + let inverted_filter = + check_function(None, "not", &[], &[filter.clone()], &BUILTIN_FUNCTIONS)?; + + Some(Filters { + filter: filter.as_remote_expr(), + inverted_filter: inverted_filter.as_remote_expr(), + }) + } else { + None + }; + + let hilbert_query = if matches!(cluster_type, ClusterType::Hilbert) { + LicenseManagerSwitch::instance() + .check_enterprise_enabled(self.ctx.get_license_key(), Feature::HilbertClustering)?; + let ast_exprs = tbl.resolve_cluster_keys(self.ctx.clone()).unwrap(); + let cluster_keys_len = ast_exprs.len(); + let settings = self.ctx.get_settings(); + let name_resolution_ctx = NameResolutionContext::try_from(settings.as_ref())?; + let cluster_key_strs = ast_exprs.into_iter().fold( + Vec::with_capacity(cluster_keys_len), + |mut acc, mut ast| { + let mut normalizer = IdentifierNormalizer { + ctx: &name_resolution_ctx, + }; + ast.drive_mut(&mut normalizer); + acc.push(format!("{:#}", &ast)); + acc + }, + ); + + let partitions = settings.get_hilbert_num_range_ids()?; + let sample_size = settings.get_hilbert_sample_size_per_block()?; + let keys_bounds_str = cluster_key_strs + .iter() + .map(|s| format!("range_bound({partitions}, {sample_size})({s}) AS {s}_bound")) + .collect::>() + .join(", "); + + let hilbert_keys_str = cluster_key_strs + .iter() + .map(|s| { + format!( + "hilbert_key(cast(ifnull(range_partition_id({table}.{s}, _keys_bound.{s}_bound), {}) as uint16))", + partitions + ) + }) + .collect::>() + .join(", "); + + let quote = settings.get_sql_dialect()?.default_ident_quote(); + let schema = tbl.schema_with_stream(); + let mut output_with_table = Vec::with_capacity(schema.fields.len()); + let mut output = Vec::with_capacity(schema.fields.len()); + for field in &schema.fields { + output_with_table.push(format!( + "{quote}{table}{quote}.{quote}{}{quote}", + field.name + )); + output.push(format!("{quote}{}{quote}", field.name)); + } + let output_with_table_str = output_with_table.join(", "); + let output_str = output.join(", "); + + let query = format!( + "WITH _keys_bound AS ( \ + SELECT \ + {keys_bounds_str} \ + FROM {database}.{table} \ + ), \ + _source_data AS ( \ + SELECT \ + {output_with_table_str}, \ + hilbert_index([{hilbert_keys_str}], 2) AS _hilbert_index \ + FROM {database}.{table}, _keys_bound \ + ) \ + SELECT \ + {output_str} \ + FROM _source_data \ + ORDER BY _hilbert_index" + ); + let tokens = tokenize_sql(query.as_str())?; + let (stmt, _) = parse_sql(&tokens, self.dialect)?; + let Statement::Query(query) = stmt else { + unreachable!() + }; + Some(query) + } else { + None + }; + + let recluster = RelOperator::Recluster(Recluster { + catalog, + database, + table, + limit, + filters, + }); + + Ok(Plan::ReclusterTable { + s_expr: Box::new(SExpr::create_leaf(Arc::new(recluster))), + hilbert_query, + is_final, + }) + } + #[async_backtrace::framed] pub(in crate::planner::binder) async fn bind_rename_table( &mut self, @@ -1646,10 +1763,15 @@ impl Binder { } = cluster_opt; let expr_len = cluster_exprs.len(); - if matches!(cluster_type, ClusterType::Hilbert) && !(2..=5).contains(&expr_len) { - return Err(ErrorCode::InvalidClusterKeys( - "Hilbert clustering requires the dimension to be between 2 and 5", - )); + if matches!(cluster_type, AstClusterType::Hilbert) { + LicenseManagerSwitch::instance() + .check_enterprise_enabled(self.ctx.get_license_key(), Feature::HilbertClustering)?; + + if !(2..=5).contains(&expr_len) { + return 
Err(ErrorCode::InvalidClusterKeys( + "Hilbert clustering requires the dimension to be between 2 and 5", + )); + } } // Build a temporary BindContext to resolve the expr diff --git a/src/query/sql/src/planner/expression_parser.rs b/src/query/sql/src/planner/expression_parser.rs index aa098e43e5d63..dce84a0d74425 100644 --- a/src/query/sql/src/planner/expression_parser.rs +++ b/src/query/sql/src/planner/expression_parser.rs @@ -28,7 +28,6 @@ use databend_common_expression::type_check::check_cast; use databend_common_expression::type_check::check_function; use databend_common_expression::types::DataType; use databend_common_expression::types::NumberDataType; -use databend_common_expression::types::NumberScalar; use databend_common_expression::ConstantFolder; use databend_common_expression::DataBlock; use databend_common_expression::DataSchemaRef; @@ -114,6 +113,17 @@ pub fn parse_exprs( ctx: Arc, table_meta: Arc, sql: &str, +) -> Result> { + let sql_dialect = ctx.get_settings().get_sql_dialect().unwrap_or_default(); + let tokens = tokenize_sql(sql)?; + let ast_exprs = parse_comma_separated_exprs(&tokens, sql_dialect)?; + parse_ast_exprs(ctx, table_meta, ast_exprs) +} + +fn parse_ast_exprs( + ctx: Arc, + table_meta: Arc, + ast_exprs: Vec, ) -> Result> { let (mut bind_context, metadata) = bind_table(table_meta)?; let settings = ctx.get_settings(); @@ -127,9 +137,6 @@ pub fn parse_exprs( false, )?; - let tokens = tokenize_sql(sql)?; - let sql_dialect = settings.get_sql_dialect().unwrap_or_default(); - let ast_exprs = parse_comma_separated_exprs(&tokens, sql_dialect)?; let exprs = ast_exprs .iter() .map(|ast| { @@ -386,41 +393,11 @@ pub fn parse_lambda_expr( pub fn parse_cluster_keys( ctx: Arc, table_meta: Arc, - cluster_key_str: &str, + ast_exprs: Vec, ) -> Result> { - let (mut bind_context, metadata) = bind_table(table_meta)?; - let settings = ctx.get_settings(); - let name_resolution_ctx = NameResolutionContext::try_from(settings.as_ref())?; - let mut type_checker = TypeChecker::try_create( - &mut bind_context, - ctx, - &name_resolution_ctx, - metadata, - &[], - true, - )?; - - let tokens = tokenize_sql(cluster_key_str)?; - let sql_dialect = settings.get_sql_dialect().unwrap_or_default(); - let mut ast_exprs = parse_comma_separated_exprs(&tokens, sql_dialect)?; - // unwrap tuple. - if ast_exprs.len() == 1 { - if let AExpr::Tuple { exprs, .. } = &ast_exprs[0] { - ast_exprs = exprs.clone(); - } - } else { - // Defensive check: - // `ast_exprs` should always contain one element which can be one of the following: - // 1. A tuple of composite cluster keys - // 2. 
A single cluster key - unreachable!("invalid cluster key ast expression, {:?}", ast_exprs); - } - - let mut exprs = Vec::with_capacity(ast_exprs.len()); - for ast in ast_exprs { - let (scalar, _) = *type_checker.resolve(&ast)?; - let expr = scalar.as_expr()?.project_column_ref(|col| col.index); - + let exprs = parse_ast_exprs(ctx, table_meta, ast_exprs)?; + let mut res = Vec::with_capacity(exprs.len()); + for expr in exprs { let inner_type = expr.data_type().remove_nullable(); let mut should_wrapper = false; if inner_type == DataType::String { @@ -455,153 +432,9 @@ pub fn parse_cluster_keys( } else { expr }; - exprs.push(expr); - } - Ok(exprs) -} - -pub fn parse_hilbert_cluster_key( - ctx: Arc, - table_meta: Arc, - cluster_key_str: &str, -) -> Result> { - let (mut bind_context, metadata) = bind_table(table_meta)?; - let settings = ctx.get_settings(); - let name_resolution_ctx = NameResolutionContext::try_from(settings.as_ref())?; - let mut type_checker = TypeChecker::try_create( - &mut bind_context, - ctx, - &name_resolution_ctx, - metadata, - &[], - true, - )?; - - let tokens = tokenize_sql(cluster_key_str)?; - let sql_dialect = settings.get_sql_dialect().unwrap_or_default(); - let mut ast_exprs = parse_comma_separated_exprs(&tokens, sql_dialect)?; - // unwrap tuple. - if ast_exprs.len() == 1 { - if let AExpr::Tuple { exprs, .. } = &ast_exprs[0] { - ast_exprs = exprs.clone(); - } - } else { - unreachable!("invalid cluster key ast expression, {:?}", ast_exprs); - } - - let expr_len = ast_exprs.len(); - if !(2..=5).contains(&expr_len) { - return Err(ErrorCode::InvalidClusterKeys( - "Hilbert clustering requires the dimension to be between 2 and 5", - )); - } - - let mut max_size = 0; - let mut byte_sizes = Vec::with_capacity(expr_len); - let mut exprs = Vec::with_capacity(expr_len); - for ast in ast_exprs { - let (scalar, _) = *type_checker.resolve(&ast)?; - let expr = scalar.as_expr()?.project_column_ref(|col| col.index); - let byte_size = hilbert_byte_size(expr.data_type())?; - max_size = max_size.max(byte_size); - byte_sizes.push(byte_size); - exprs.push(expr); - } - - let max_size = max_size.min(8); - let common_cast = match max_size { - 1 => "to_int8", - 2 => "to_int16", - 4 => "to_int32", - 8 => "to_int64", - _ => unreachable!(), - }; - let max_val = Expr::Constant { - span: None, - scalar: Scalar::Binary(vec![0xFF; max_size]), - data_type: DataType::Binary, - }; - - for (expr, byte_size) in exprs.iter_mut().zip(byte_sizes.into_iter()) { - let inner_type = expr.data_type().remove_nullable(); - let cast_str = match inner_type { - DataType::Date | DataType::Timestamp | DataType::Boolean => Some(common_cast), - DataType::Decimal(_) => Some("to_float64"), - DataType::Number(t) if max_size > byte_size => { - if matches!(t, NumberDataType::Float32) { - Some("to_float64") - } else { - Some(common_cast) - } - } - _ => None, - }; - *expr = if let Some(cast) = cast_str { - check_function(None, cast, &[], &[expr.clone()], &BUILTIN_FUNCTIONS)? 
- } else { - expr.clone() - }; - *expr = check_function( - None, - "hilbert_key", - &[], - &[expr.clone()], - &BUILTIN_FUNCTIONS, - )?; - let data_type = expr.data_type(); - let is_nullable = data_type.is_nullable(); - if is_nullable { - let is_not_null_expr = check_function( - None, - "is_not_null", - &[], - &[expr.clone()], - &BUILTIN_FUNCTIONS, - )?; - - let assume_not_null_expr = check_function( - None, - "assume_not_null", - &[], - &[expr.clone()], - &BUILTIN_FUNCTIONS, - )?; - - *expr = check_function( - None, - "if", - &[], - &[is_not_null_expr, assume_not_null_expr, max_val.clone()], - &BUILTIN_FUNCTIONS, - )?; - } - } - - let array = check_function(None, "array", &[], &exprs, &BUILTIN_FUNCTIONS)?; - let result = check_function( - None, - "hilbert_index", - &[], - &[array, Expr::Constant { - span: None, - scalar: Scalar::Number(NumberScalar::UInt64(max_size as u64)), - data_type: DataType::Number(NumberDataType::UInt64), - }], - &BUILTIN_FUNCTIONS, - )?; - Ok(vec![result]) -} - -fn hilbert_byte_size(data_type: &DataType) -> Result { - match data_type { - DataType::Nullable(inner) => hilbert_byte_size(inner), - DataType::Number(_) | DataType::Date | DataType::Timestamp | DataType::Decimal(_) => { - Ok(data_type.numeric_byte_size().unwrap()) - } - DataType::Boolean => Ok(1), - DataType::String => Ok(24), - _ => Err(ErrorCode::Internal("unsupported data type for hilbert")), + res.push(expr); } + Ok(res) } pub fn analyze_cluster_keys( diff --git a/src/query/sql/src/planner/optimizer/optimizer.rs b/src/query/sql/src/planner/optimizer/optimizer.rs index de1ea299a3fdd..9529adb43ef1c 100644 --- a/src/query/sql/src/planner/optimizer/optimizer.rs +++ b/src/query/sql/src/planner/optimizer/optimizer.rs @@ -507,7 +507,7 @@ async fn optimize_mutation(mut opt_ctx: OptimizerContext, s_expr: SExpr) -> Resu if let &RelOperator::Exchange(_) = input_s_expr.plan() { input_s_expr = input_s_expr.child(0)?.clone(); } - // If there still exists a Exchange::Merge operator, we should disable distributed optimization and + // If there still exists an Exchange::Merge operator, we should disable distributed optimization and // optimize the input plan again. 
if input_s_expr.has_merge_exchange() { opt_ctx = opt_ctx.with_enable_distributed_optimization(false); diff --git a/src/query/sql/src/planner/planner.rs b/src/query/sql/src/planner/planner.rs index 8cdf8fe2ba16a..62126bca834b7 100644 --- a/src/query/sql/src/planner/planner.rs +++ b/src/query/sql/src/planner/planner.rs @@ -85,7 +85,7 @@ impl Planner { #[fastrace::trace] pub async fn plan_sql(&mut self, sql: &str) -> Result<(Plan, PlanExtras)> { let extras = self.parse_sql(sql)?; - let plan = self.plan_stmt(&extras.statement).await?; + let plan = self.plan_stmt(&extras.statement, true).await?; Ok((plan, extras)) } @@ -221,7 +221,7 @@ impl Planner { #[async_backtrace::framed] #[fastrace::trace] - pub async fn plan_stmt(&mut self, stmt: &Statement) -> Result { + pub async fn plan_stmt(&mut self, stmt: &Statement, attach_query: bool) -> Result { let start = Instant::now(); let settings = self.ctx.get_settings(); // Step 3: Bind AST with catalog, and generate a pure logical SExpr @@ -241,9 +241,11 @@ impl Planner { ); if let Some(plan) = plan { info!("logical plan from cache, time used: {:?}", start.elapsed()); - // update for clickhouse handler - self.ctx - .attach_query_str(get_query_kind(stmt), stmt.to_mask_sql()); + if attach_query { + // update for clickhouse handler + self.ctx + .attach_query_str(get_query_kind(stmt), stmt.to_mask_sql()); + } return Ok(plan.plan); } enable_planner_cache = c; @@ -259,12 +261,11 @@ impl Planner { .with_subquery_executor(self.query_executor.clone()); // Indicate binder there is no need to collect column statistics for the binding table. - self.ctx - .attach_query_str(get_query_kind(stmt), stmt.to_mask_sql()); let plan = binder.bind(stmt).await?; - // attach again to avoid the query kind is overwritten by the subquery - self.ctx - .attach_query_str(get_query_kind(stmt), stmt.to_mask_sql()); + if attach_query { + self.ctx + .attach_query_str(get_query_kind(stmt), stmt.to_mask_sql()); + } // Step 4: Optimize the SExpr with optimizers, and generate optimized physical SExpr let opt_ctx = OptimizerContext::new(self.ctx.clone(), metadata.clone()) diff --git a/src/query/sql/src/planner/plans/mod.rs b/src/query/sql/src/planner/plans/mod.rs index 2704f874b0490..fc0a4746e7f29 100644 --- a/src/query/sql/src/planner/plans/mod.rs +++ b/src/query/sql/src/planner/plans/mod.rs @@ -85,7 +85,7 @@ pub use plan::*; pub use presign::*; pub use project_set::*; pub use r_cte_scan::*; -pub use recluster::Recluster; +pub use recluster::*; pub use replace::Replace; pub use revert_table::RevertTablePlan; pub use scalar_expr::*; diff --git a/src/query/sql/src/planner/plans/plan.rs b/src/query/sql/src/planner/plans/plan.rs index e3abfd95793f2..9a2c2f3406285 100644 --- a/src/query/sql/src/planner/plans/plan.rs +++ b/src/query/sql/src/planner/plans/plan.rs @@ -17,6 +17,7 @@ use std::fmt::Formatter; use std::sync::Arc; use databend_common_ast::ast::ExplainKind; +use databend_common_ast::ast::Query; use databend_common_catalog::query_kind::QueryKind; use databend_common_expression::types::DataType; use databend_common_expression::DataField; @@ -243,6 +244,7 @@ pub enum Plan { DropTableClusterKey(Box), ReclusterTable { s_expr: Box, + hilbert_query: Option>, is_final: bool, }, RevertTable(Box), diff --git a/src/query/sql/src/planner/plans/recluster.rs b/src/query/sql/src/planner/plans/recluster.rs index 4cd9fbb6c63d2..efe48c6cacd5b 100644 --- a/src/query/sql/src/planner/plans/recluster.rs +++ b/src/query/sql/src/planner/plans/recluster.rs @@ -12,29 +12,48 @@ // See the License for the specific 
language governing permissions and // limitations under the License. +use std::sync::Arc; + use databend_common_catalog::plan::Filters; +use educe::Educe; +use crate::optimizer::SExpr; use crate::plans::Operator; use crate::plans::RelOp; +use crate::plans::RelOperator; -#[derive(Clone, Debug, PartialEq, Eq)] +#[derive(Debug, PartialEq, Clone, Educe)] +#[educe(Eq, Hash)] pub struct Recluster { pub catalog: String, pub database: String, pub table: String, pub limit: Option, + #[educe(Hash(ignore))] pub filters: Option, } -impl std::hash::Hash for Recluster { - fn hash(&self, state: &mut H) { - self.table.hash(state); - } -} - impl Operator for Recluster { fn rel_op(&self) -> RelOp { RelOp::Recluster } } + +pub fn set_update_stream_columns(s_expr: &SExpr) -> databend_common_exception::Result { + match s_expr.plan() { + RelOperator::Scan(scan) if scan.table_index == 0 => { + let mut scan = scan.clone(); + scan.set_update_stream_columns(true); + Ok(SExpr::create_leaf(Arc::new(scan.into()))) + } + _ => { + let mut children = Vec::with_capacity(s_expr.arity()); + for child in s_expr.children() { + let child = set_update_stream_columns(child)?; + children.push(Arc::new(child)); + } + Ok(s_expr.replace_children(children)) + } + } +} diff --git a/src/query/storages/common/table_meta/src/table/table_keys.rs b/src/query/storages/common/table_meta/src/table/table_keys.rs index 0e4296fc3c8bd..e4202d5c05d51 100644 --- a/src/query/storages/common/table_meta/src/table/table_keys.rs +++ b/src/query/storages/common/table_meta/src/table/table_keys.rs @@ -87,7 +87,7 @@ pub fn is_internal_opt_key>(opt_key: S) -> bool { INTERNAL_TABLE_OPTION_KEYS.contains(opt_key.as_ref().to_lowercase().as_str()) } -#[derive(Debug, Clone, Eq, PartialEq)] +#[derive(Debug, serde::Serialize, serde::Deserialize, Clone, Eq, PartialEq, Copy)] pub enum ClusterType { Linear, Hilbert, diff --git a/src/query/storages/fuse/src/fuse_table.rs b/src/query/storages/fuse/src/fuse_table.rs index 9ac1dab010251..d89be771f19f0 100644 --- a/src/query/storages/fuse/src/fuse_table.rs +++ b/src/query/storages/fuse/src/fuse_table.rs @@ -64,7 +64,6 @@ use databend_common_meta_app::schema::UpsertTableCopiedFileReq; use databend_common_pipeline_core::Pipeline; use databend_common_sql::binder::STREAM_COLUMN_FACTORY; use databend_common_sql::parse_cluster_keys; -use databend_common_sql::parse_hilbert_cluster_key; use databend_common_sql::BloomIndexColumns; use databend_common_storage::init_operator; use databend_common_storage::DataOperator; @@ -403,28 +402,25 @@ impl FuseTable { self.cluster_key_meta.clone().map(|v| v.0) } - pub fn cluster_keys(&self, ctx: Arc) -> Vec> { + pub fn linear_cluster_keys(&self, ctx: Arc) -> Vec> { + if self + .cluster_type() + .is_none_or(|v| matches!(v, ClusterType::Hilbert)) + { + return vec![]; + } + let table_meta = Arc::new(self.clone()); - if let Some((_, order)) = &self.cluster_key_meta { - let cluster_type = self.get_option(OPT_KEY_CLUSTER_TYPE, ClusterType::Linear); - let cluster_keys = match cluster_type { - ClusterType::Linear => parse_cluster_keys(ctx, table_meta.clone(), order), - ClusterType::Hilbert => parse_hilbert_cluster_key(ctx, table_meta.clone(), order), - } - .unwrap(); - - let cluster_keys = cluster_keys - .iter() - .map(|k| { - k.project_column_ref(|index| { - table_meta.schema().field(*index).name().to_string() - }) + let cluster_key_exprs = self.resolve_cluster_keys(ctx.clone()).unwrap(); + let exprs = parse_cluster_keys(ctx, table_meta.clone(), cluster_key_exprs).unwrap(); + let cluster_keys = exprs + 
.iter() + .map(|k| { + k.project_column_ref(|index| table_meta.schema().field(*index).name().to_string()) .as_remote_expr() - }) - .collect(); - return cluster_keys; - } - vec![] + }) + .collect(); + cluster_keys } pub fn bloom_index_cols(&self) -> BloomIndexColumns { @@ -439,7 +435,7 @@ impl FuseTable { } pub fn cluster_key_types(&self, ctx: Arc) -> Vec { - let Some((_, cluster_key_str)) = &self.cluster_key_meta else { + let Some(ast_exprs) = self.resolve_cluster_keys(ctx.clone()) else { return vec![]; }; let cluster_type = self.get_option(OPT_KEY_CLUSTER_TYPE, ClusterType::Linear); @@ -447,7 +443,7 @@ impl FuseTable { ClusterType::Hilbert => vec![DataType::Binary], ClusterType::Linear => { let cluster_keys = - parse_cluster_keys(ctx, Arc::new(self.clone()), cluster_key_str).unwrap(); + parse_cluster_keys(ctx, Arc::new(self.clone()), ast_exprs).unwrap(); cluster_keys .into_iter() .map(|v| v.data_type().clone()) diff --git a/src/query/storages/fuse/src/operations/append.rs b/src/query/storages/fuse/src/operations/append.rs index 0588a64b4c77a..6f80b8865a1aa 100644 --- a/src/query/storages/fuse/src/operations/append.rs +++ b/src/query/storages/fuse/src/operations/append.rs @@ -33,6 +33,7 @@ use databend_common_pipeline_transforms::processors::TransformSortPartial; use databend_common_sql::evaluator::BlockOperator; use databend_common_sql::evaluator::CompoundBlockOperator; use databend_common_sql::executor::physical_plans::MutationKind; +use databend_storages_common_table_meta::table::ClusterType; use crate::operations::common::TransformSerializeBlock; use crate::statistics::ClusterStatsGenerator; @@ -169,8 +170,8 @@ impl FuseTable { block_thresholds: BlockThresholds, modified_schema: Option>, ) -> Result { - let cluster_keys = self.cluster_keys(ctx.clone()); - if cluster_keys.is_empty() { + let cluster_type = self.cluster_type(); + if cluster_type.is_none_or(|v| v == ClusterType::Hilbert) { return Ok(ClusterStatsGenerator::default()); } @@ -178,6 +179,7 @@ impl FuseTable { modified_schema.unwrap_or(DataSchema::from(self.schema_with_stream()).into()); let mut merged = input_schema.fields().clone(); + let cluster_keys = self.linear_cluster_keys(ctx.clone()); let mut cluster_key_index = Vec::with_capacity(cluster_keys.len()); let mut extra_key_num = 0; diff --git a/src/query/storages/fuse/src/operations/changes.rs b/src/query/storages/fuse/src/operations/changes.rs index 9c8f013c2270c..a049eced60ba6 100644 --- a/src/query/storages/fuse/src/operations/changes.rs +++ b/src/query/storages/fuse/src/operations/changes.rs @@ -292,7 +292,10 @@ impl FuseTable { if !self.is_native() || self.cluster_key_meta().is_none() { (vec![], None) } else { - (self.cluster_keys(ctx.clone()), self.cluster_key_meta()) + ( + self.linear_cluster_keys(ctx.clone()), + self.cluster_key_meta(), + ) }; let bloom_index_cols = self.bloom_index_cols(); let mut pruner = FusePruner::create_with_pages( diff --git a/src/query/storages/fuse/src/operations/common/processors/sink_commit.rs b/src/query/storages/fuse/src/operations/common/processors/sink_commit.rs index 413a6c1170c44..dd35f5f4590a2 100644 --- a/src/query/storages/fuse/src/operations/common/processors/sink_commit.rs +++ b/src/query/storages/fuse/src/operations/common/processors/sink_commit.rs @@ -442,7 +442,7 @@ where F: SnapshotGenerator + Send + 'static metrics_inc_commit_copied_files(files.file_info.len() as u64); } for segment_loc in std::mem::take(&mut self.new_segment_locs).into_iter() { - self.ctx.add_segment_location(segment_loc)?; + 
self.ctx.add_written_segment_location(segment_loc)?; } let target_descriptions = { diff --git a/src/query/storages/fuse/src/operations/common/processors/transform_mutation_aggregator.rs b/src/query/storages/fuse/src/operations/common/processors/transform_mutation_aggregator.rs index 3a42880d3b31c..7e44a6573e462 100644 --- a/src/query/storages/fuse/src/operations/common/processors/transform_mutation_aggregator.rs +++ b/src/query/storages/fuse/src/operations/common/processors/transform_mutation_aggregator.rs @@ -30,10 +30,12 @@ use databend_common_metrics::storage::metrics_inc_recluster_write_block_nums; use databend_common_pipeline_transforms::processors::AsyncAccumulatingTransform; use databend_common_sql::executor::physical_plans::MutationKind; use databend_storages_common_table_meta::meta::BlockMeta; +use databend_storages_common_table_meta::meta::ClusterStatistics; use databend_storages_common_table_meta::meta::Location; use databend_storages_common_table_meta::meta::SegmentInfo; use databend_storages_common_table_meta::meta::Statistics; use databend_storages_common_table_meta::meta::Versioned; +use databend_storages_common_table_meta::table::ClusterType; use itertools::Itertools; use log::debug; use log::info; @@ -61,16 +63,17 @@ use crate::FUSE_OPT_KEY_BLOCK_PER_SEGMENT; pub struct TableMutationAggregator { ctx: Arc, schema: TableSchemaRef, + table_id: u64, dal: Operator, location_gen: TableMetaLocationGenerator, - thresholds: BlockThresholds, block_per_seg: usize, - default_cluster_key_id: Option, + default_cluster_key_id: Option, base_segments: Vec, // Used for recluster. recluster_merged_blocks: Vec>, + set_hilbert_level: bool, mutations: HashMap, appended_segments: Vec, @@ -81,7 +84,6 @@ pub struct TableMutationAggregator { kind: MutationKind, start_time: Instant, finished_tasks: usize, - table_id: u64, } // takes in table mutation logs and aggregates them (former mutation_transform) @@ -125,6 +127,7 @@ impl AsyncAccumulatingTransform for TableMutationAggregator { } impl TableMutationAggregator { + #[allow(clippy::too_many_arguments)] pub fn create( table: &FuseTable, ctx: Arc, @@ -134,6 +137,16 @@ impl TableMutationAggregator { removed_statistics: Statistics, kind: MutationKind, ) -> Self { + let set_hilbert_level = table + .cluster_type() + .is_some_and(|v| matches!(v, ClusterType::Hilbert)) + && matches!( + kind, + MutationKind::Delete + | MutationKind::MergeInto + | MutationKind::Replace + | MutationKind::Recluster + ); TableMutationAggregator { ctx, schema: table.schema(), @@ -141,6 +154,7 @@ impl TableMutationAggregator { location_gen: table.meta_location_generator().clone(), thresholds: table.get_block_thresholds(), default_cluster_key_id: table.cluster_key_id(), + set_hilbert_level, block_per_seg: table .get_option(FUSE_OPT_KEY_BLOCK_PER_SEGMENT, DEFAULT_BLOCK_PER_SEGMENT), mutations: HashMap::new(), @@ -258,6 +272,9 @@ impl TableMutationAggregator { let chunk_size = merged_blocks.len().div_ceil(segments_num); let default_cluster_key = Some(default_cluster_key_id); let thresholds = self.thresholds; + let block_per_seg = self.block_per_seg; + let set_hilbert_level = self.set_hilbert_level; + let kind = self.kind; for chunk in &merged_blocks.into_iter().chunks(chunk_size) { let new_blocks = chunk.collect::>(); let all_perfect = new_blocks.len() > 1; @@ -272,7 +289,9 @@ impl TableMutationAggregator { thresholds, default_cluster_key, all_perfect, - MutationKind::Recluster, + block_per_seg, + kind, + set_hilbert_level, ) .await }); @@ -297,7 +316,7 @@ impl 
TableMutationAggregator { let mut appended_segments = Vec::new(); let mut replaced_segments = HashMap::with_capacity(replaced_segments_len); if new_segments_len > removed_segments_len { - // The remain new segments will be append. + // The remain new segments will be appended. let appended = new_segments.split_off(removed_segments_len); for (location, stats) in appended.into_iter().rev() { let segment_loc = (location, SegmentInfo::VERSION); @@ -406,6 +425,9 @@ impl TableMutationAggregator { ) -> Result> { let thresholds = self.thresholds; let default_cluster_key_id = self.default_cluster_key_id; + let block_per_seg = self.block_per_seg; + let kind = self.kind; + let set_hilbert_level = self.set_hilbert_level; let mut tasks = Vec::with_capacity(segment_indices.len()); for index in segment_indices { let segment_mutation = self.mutations.remove(&index).unwrap(); @@ -413,10 +435,10 @@ impl TableMutationAggregator { let schema = self.schema.clone(); let op = self.dal.clone(); let location_gen = self.location_gen.clone(); - let kind = self.kind; - let mut all_perfect = false; tasks.push(async move { + let mut all_perfect = false; + let mut set_level = false; let (new_blocks, origin_summary) = if let Some(loc) = location { // read the old segment let compact_segment_info = @@ -446,6 +468,12 @@ impl TableMutationAggregator { // assign back the mutated blocks to segment let new_blocks = block_editor.into_values().collect::>(); + set_level = set_hilbert_level + && segment_info + .summary + .cluster_stats + .as_ref() + .is_some_and(|v| v.cluster_key_id == default_cluster_key_id.unwrap()); (new_blocks, Some(segment_info.summary)) } else { // use by compact. @@ -469,7 +497,9 @@ impl TableMutationAggregator { thresholds, default_cluster_key_id, all_perfect, + block_per_seg, kind, + set_level, ) .await?; @@ -541,7 +571,9 @@ async fn write_segment( thresholds: BlockThresholds, default_cluster_key: Option, all_perfect: bool, + block_per_seg: usize, kind: MutationKind, + set_hilbert_level: bool, ) -> Result<(String, Statistics)> { let location = location_gen.gen_segment_info_location(); let mut new_summary = reduce_block_metas(&blocks, thresholds, default_cluster_key); @@ -555,6 +587,25 @@ async fn write_segment( new_summary.perfect_block_count = new_summary.block_count; } } + if set_hilbert_level { + debug_assert!(new_summary.cluster_stats.is_none()); + let level = if new_summary.block_count >= block_per_seg as u64 + && (new_summary.row_count as usize >= block_per_seg * thresholds.min_rows_per_block + || new_summary.uncompressed_byte_size as usize + >= block_per_seg * thresholds.max_bytes_per_block) + { + -1 + } else { + 0 + }; + new_summary.cluster_stats = Some(ClusterStatistics { + cluster_key_id: default_cluster_key.unwrap(), + min: vec![], + max: vec![], + level, + pages: None, + }); + } // create new segment info let new_segment = SegmentInfo::new(blocks, new_summary.clone()); new_segment diff --git a/src/query/storages/fuse/src/operations/mutation/mutator/block_compact_mutator.rs b/src/query/storages/fuse/src/operations/mutation/mutator/block_compact_mutator.rs index 4e487b41d4873..b0c159fdde7b1 100644 --- a/src/query/storages/fuse/src/operations/mutation/mutator/block_compact_mutator.rs +++ b/src/query/storages/fuse/src/operations/mutation/mutator/block_compact_mutator.rs @@ -349,7 +349,7 @@ impl SegmentCompactChecker { return vec![]; } - if self.total_block_count > 2 * self.block_threshold { + if self.total_block_count >= 2 * self.block_threshold { self.total_block_count = 0; let trivial = 
vec![(idx, segment)]; if self.segments.is_empty() { @@ -458,7 +458,7 @@ impl CompactTaskBuilder { self.blocks.push(block.clone()); (false, true) } else { - // blocks > 2N + // blocks >= 2N (true, !self.blocks.is_empty()) } } diff --git a/src/query/storages/fuse/src/operations/read_partitions.rs b/src/query/storages/fuse/src/operations/read_partitions.rs index bc3730e9a7b03..e0a6d017d65e5 100644 --- a/src/query/storages/fuse/src/operations/read_partitions.rs +++ b/src/query/storages/fuse/src/operations/read_partitions.rs @@ -49,6 +49,7 @@ use databend_storages_common_pruner::TopNPrunner; use databend_storages_common_table_meta::meta::BlockMeta; use databend_storages_common_table_meta::meta::ColumnStatistics; use databend_storages_common_table_meta::table::ChangeType; +use databend_storages_common_table_meta::table::ClusterType; use log::info; use opendal::Operator; use sha2::Digest; @@ -104,6 +105,18 @@ impl FuseTable { ); match snapshot { Some(snapshot) => { + // To optimize the Hilbert clustering logic, it is necessary to pre-set the selected segments. + // Since the recluster logic requires scanning the table twice, fetching the segments directly + // can avoid redundant selection logic and ensure that the same data is accessed during both scans. + // TODO(zhyass): refactor if necessary. + let selected_segment = ctx.get_selected_segment_locations(); + let segment_locs = if !selected_segment.is_empty() { + selected_segment + } else { + snapshot.segments.clone() + }; + let segment_len = segment_locs.len(); + let snapshot_loc = self .meta_location_generator .snapshot_location_from_uuid(&snapshot.snapshot_id, snapshot.format_version)?; @@ -115,10 +128,10 @@ impl FuseTable { nodes_num = cluster.nodes.len(); } - if !dry_run && snapshot.segments.len() > nodes_num && distributed_pruning { - let mut segments = Vec::with_capacity(snapshot.segments.len()); - for (idx, segment_location) in snapshot.segments.iter().enumerate() { - segments.push(FuseLazyPartInfo::create(idx, segment_location.clone())) + if !dry_run && segment_len > nodes_num && distributed_pruning { + let mut segments = Vec::with_capacity(segment_locs.len()); + for (idx, segment_location) in segment_locs.into_iter().enumerate() { + segments.push(FuseLazyPartInfo::create(idx, segment_location)) } return Ok(( @@ -126,8 +139,8 @@ impl FuseTable { Some(snapshot_loc), snapshot.summary.row_count as usize, snapshot.summary.compressed_byte_size as usize, - snapshot.segments.len(), - snapshot.segments.len(), + segment_len, + segment_len, ), Partitions::create(PartitionsShuffleKind::Mod, segments), )); @@ -136,8 +149,7 @@ impl FuseTable { let snapshot_loc = Some(snapshot_loc); let table_schema = self.schema_with_stream(); let summary = snapshot.summary.block_count as usize; - let segments_location = - create_segment_location_vector(snapshot.segments.clone(), snapshot_loc); + let segments_location = create_segment_location_vector(segment_locs, snapshot_loc); self.prune_snapshot_blocks( ctx.clone(), @@ -471,31 +483,32 @@ impl FuseTable { None }; - let pruner = if !self.is_native() || self.cluster_key_meta.is_none() { - FusePruner::create( - &ctx, - dal, - table_schema.clone(), - &push_downs, - self.bloom_index_cols(), - bloom_index_builder, - self.get_storage_format(), - )? - } else { - let cluster_keys = self.cluster_keys(ctx.clone()); - - FusePruner::create_with_pages( - &ctx, - dal, - table_schema, - &push_downs, - self.cluster_key_meta.clone(), - cluster_keys, - self.bloom_index_cols(), - bloom_index_builder, - self.get_storage_format(), - )? 
- }; + let pruner = + if !self.is_native() || self.cluster_type().is_none_or(|v| v != ClusterType::Linear) { + FusePruner::create( + &ctx, + dal, + table_schema.clone(), + &push_downs, + self.bloom_index_cols(), + bloom_index_builder, + self.get_storage_format(), + )? + } else { + let cluster_keys = self.linear_cluster_keys(ctx.clone()); + + FusePruner::create_with_pages( + &ctx, + dal, + table_schema, + &push_downs, + self.cluster_key_meta.clone(), + cluster_keys, + self.bloom_index_cols(), + bloom_index_builder, + self.get_storage_format(), + )? + }; Ok(pruner) } diff --git a/src/query/storages/fuse/src/operations/recluster.rs b/src/query/storages/fuse/src/operations/recluster.rs index f28e351c34b10..b4956c81c97a0 100644 --- a/src/query/storages/fuse/src/operations/recluster.rs +++ b/src/query/storages/fuse/src/operations/recluster.rs @@ -32,6 +32,7 @@ use databend_common_metrics::storage::metrics_inc_recluster_segment_nums_schedul use databend_common_sql::BloomIndexColumns; use databend_storages_common_table_meta::meta::CompactSegmentInfo; use databend_storages_common_table_meta::meta::TableSnapshot; +use databend_storages_common_table_meta::table::ClusterType; use log::warn; use opendal::Operator; @@ -61,14 +62,12 @@ impl FuseTable { ctx.set_status_info(status); } - if self.cluster_key_meta.is_none() { + let cluster_type = self.cluster_type(); + if cluster_type.is_none_or(|v| v != ClusterType::Linear) { return Ok(None); } - let snapshot_opt = self.read_table_snapshot().await?; - let snapshot = if let Some(val) = snapshot_opt { - val - } else { + let Some(snapshot) = self.read_table_snapshot().await? else { // no snapshot, no recluster. return Ok(None); }; diff --git a/src/query/storages/fuse/src/pruning/fuse_pruner.rs b/src/query/storages/fuse/src/pruning/fuse_pruner.rs index 1e52bc3578c47..f834f13055c22 100644 --- a/src/query/storages/fuse/src/pruning/fuse_pruner.rs +++ b/src/query/storages/fuse/src/pruning/fuse_pruner.rs @@ -508,9 +508,6 @@ impl FusePruner { let res = worker?; metas.extend(res); } - // Todo:: for now, all operation (contains other mutation other than delete, like select,update etc.) - // will get here, we can prevent other mutations like update and so on. - // TopN pruner. 
self.topn_pruning(metas) } diff --git a/src/query/storages/fuse/src/table_functions/clustering_information.rs b/src/query/storages/fuse/src/table_functions/clustering_information.rs index 1f153b2e1b1aa..4dd15b734ad22 100644 --- a/src/query/storages/fuse/src/table_functions/clustering_information.rs +++ b/src/query/storages/fuse/src/table_functions/clustering_information.rs @@ -189,7 +189,7 @@ impl<'a> ClusteringInformation<'a> { (cluster_key, exprs) } (Some(a), None) => { - let exprs = self.table.cluster_keys(self.ctx.clone()); + let exprs = self.table.linear_cluster_keys(self.ctx.clone()); let exprs = exprs .iter() .map(|k| k.as_expr(&BUILTIN_FUNCTIONS)) @@ -205,13 +205,17 @@ impl<'a> ClusteringInformation<'a> { } }; - let cluster_type = if default_cluster_key_id.is_some() { - self.table - .get_option(OPT_KEY_CLUSTER_TYPE, ClusterType::Linear) - .to_string() - } else { - "linear".to_string() - }; + if default_cluster_key_id.is_some() { + let typ = self + .table + .get_option(OPT_KEY_CLUSTER_TYPE, ClusterType::Linear); + if matches!(typ, ClusterType::Hilbert) { + return Err(ErrorCode::UnsupportedClusterType( + "Unsupported 'hilbert' type, please use `hilbert_clustering_information` instead", + )); + } + } + let cluster_type = "linear".to_string(); let snapshot = self.table.read_table_snapshot().await?; let now = Utc::now(); diff --git a/src/query/storages/fuse/src/table_functions/clustering_statistics.rs b/src/query/storages/fuse/src/table_functions/clustering_statistics.rs index e1f1f994b2f31..bf3292ce036f3 100644 --- a/src/query/storages/fuse/src/table_functions/clustering_statistics.rs +++ b/src/query/storages/fuse/src/table_functions/clustering_statistics.rs @@ -172,7 +172,6 @@ impl<'a> ClusteringStatisticsImpl<'a> { ); let mut row_num = 0; - let mut end_flag = false; let chunk_size = std::cmp::min(self.ctx.get_settings().get_max_threads()? as usize * 4, len).max(1); @@ -220,14 +219,9 @@ impl<'a> ClusteringStatisticsImpl<'a> { row_num += 1; if row_num >= limit { - end_flag = true; - break; + break 'FOR; } } - - if end_flag { - break 'FOR; - } } } diff --git a/src/query/storages/fuse/src/table_functions/fuse_block.rs b/src/query/storages/fuse/src/table_functions/fuse_block.rs index 7a96a755ba5d6..e81525fbc11b8 100644 --- a/src/query/storages/fuse/src/table_functions/fuse_block.rs +++ b/src/query/storages/fuse/src/table_functions/fuse_block.rs @@ -90,7 +90,6 @@ impl TableMetaFunc for FuseBlock { let segments_io = SegmentsIO::create(ctx.clone(), tbl.operator.clone(), tbl.schema()); let mut row_num = 0; - let mut end_flag = false; let chunk_size = std::cmp::min(ctx.get_settings().get_max_threads()? 
as usize * 4, len).max(1); 'FOR: for chunk in snapshot.segments.chunks(chunk_size) { @@ -117,14 +116,9 @@ impl TableMetaFunc for FuseBlock { row_num += 1; if row_num >= limit { - end_flag = true; - break; + break 'FOR; } } - - if end_flag { - break 'FOR; - } } } diff --git a/src/query/storages/fuse/src/table_functions/fuse_column.rs b/src/query/storages/fuse/src/table_functions/fuse_column.rs index 7ae42f3025df5..484eb8b53c537 100644 --- a/src/query/storages/fuse/src/table_functions/fuse_column.rs +++ b/src/query/storages/fuse/src/table_functions/fuse_column.rs @@ -98,7 +98,6 @@ impl TableMetaFunc for FuseColumn { let schema = tbl.schema(); let leaf_fields = schema.leaf_fields(); - let mut end = false; 'FOR: for chunk in snapshot.segments.chunks(chunk_size) { let segments = segments_io .read_segments::(chunk, true) @@ -128,15 +127,10 @@ impl TableMetaFunc for FuseColumn { row_num += 1; if row_num >= limit { - end = true; - break; + break 'FOR; } } } - - if end { - break 'FOR; - } } } } diff --git a/src/query/storages/fuse/src/table_functions/fuse_segment.rs b/src/query/storages/fuse/src/table_functions/fuse_segment.rs index 8a84757f8eacd..d5a6e91e9205c 100644 --- a/src/query/storages/fuse/src/table_functions/fuse_segment.rs +++ b/src/query/storages/fuse/src/table_functions/fuse_segment.rs @@ -25,7 +25,7 @@ use databend_common_expression::TableDataType; use databend_common_expression::TableField; use databend_common_expression::TableSchema; use databend_common_expression::TableSchemaRefExt; -use databend_storages_common_table_meta::meta::SegmentInfo; +use databend_storages_common_table_meta::meta::CompactSegmentInfo; use databend_storages_common_table_meta::meta::TableSnapshot; use crate::io::SegmentsIO; @@ -85,7 +85,7 @@ impl TableMetaFunc for FuseSegment { std::cmp::min(ctx.get_settings().get_max_threads()? as usize * 4, len).max(1); for chunk in segment_locations.chunks(chunk_size) { let segments = segments_io - .read_segments::(chunk, true) + .read_segments::>(chunk, true) .await?; for (idx, segment) in segments.into_iter().enumerate() { diff --git a/src/query/storages/fuse/src/table_functions/hilbert_clustering_information.rs b/src/query/storages/fuse/src/table_functions/hilbert_clustering_information.rs new file mode 100644 index 0000000000000..f57ef9bf9f711 --- /dev/null +++ b/src/query/storages/fuse/src/table_functions/hilbert_clustering_information.rs @@ -0,0 +1,241 @@ +// Copyright 2021 Datafuse Labs +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. 
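
Note on the loop changes in clustering_statistics.rs, fuse_block.rs, and fuse_column.rs above: the `end_flag`/`end` booleans are dropped in favour of breaking straight out of the labelled outer loop once the row limit is hit. A minimal sketch of that pattern, with illustrative names that are not taken from the crate:

// Walk segments in chunks, but stop all scanning once `limit` rows are collected.
fn collect_rows(segments: &[u64], chunk_size: usize, limit: usize) -> Vec<u64> {
    let mut rows = Vec::new();
    'outer: for chunk in segments.chunks(chunk_size) {
        for seg in chunk {
            rows.push(*seg);
            if rows.len() >= limit {
                // The labelled break leaves both loops at once,
                // so no separate end-flag bookkeeping is needed.
                break 'outer;
            }
        }
    }
    rows
}
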
+ +use std::sync::Arc; + +use chrono::Utc; +use databend_common_catalog::catalog::CATALOG_DEFAULT; +use databend_common_catalog::plan::DataSourcePlan; +use databend_common_catalog::table::Table; +use databend_common_catalog::table_args::TableArgs; +use databend_common_catalog::table_context::TableContext; +use databend_common_exception::ErrorCode; +use databend_common_exception::Result; +use databend_common_expression::types::DataType; +use databend_common_expression::types::NumberDataType; +use databend_common_expression::types::NumberScalar; +use databend_common_expression::BlockEntry; +use databend_common_expression::DataBlock; +use databend_common_expression::Scalar; +use databend_common_expression::TableDataType; +use databend_common_expression::TableField; +use databend_common_expression::TableSchema; +use databend_common_expression::TableSchemaRef; +use databend_common_expression::TableSchemaRefExt; +use databend_common_expression::Value; +use databend_storages_common_table_meta::meta::CompactSegmentInfo; +use databend_storages_common_table_meta::table::ClusterType; +use databend_storages_common_table_meta::table::OPT_KEY_CLUSTER_TYPE; + +use crate::io::SegmentsIO; +use crate::table_functions::parse_db_tb_args; +use crate::table_functions::string_literal; +use crate::table_functions::SimpleArgFunc; +use crate::table_functions::SimpleArgFuncTemplate; +use crate::FuseTable; + +pub struct HilbertClusteringInfoArgs { + database_name: String, + table_name: String, +} + +impl From<&HilbertClusteringInfoArgs> for TableArgs { + fn from(args: &HilbertClusteringInfoArgs) -> Self { + let tbl_args = vec![ + string_literal(args.database_name.as_str()), + string_literal(args.table_name.as_str()), + ]; + TableArgs::new_positioned(tbl_args) + } +} + +impl TryFrom<(&str, TableArgs)> for HilbertClusteringInfoArgs { + type Error = ErrorCode; + fn try_from( + (func_name, table_args): (&str, TableArgs), + ) -> std::result::Result { + let (database_name, table_name) = parse_db_tb_args(&table_args, func_name)?; + + Ok(Self { + database_name, + table_name, + }) + } +} + +pub type HilbertClusteringInfoFunc = SimpleArgFuncTemplate; +pub struct HilbertClusteringInfo; + +#[async_trait::async_trait] +impl SimpleArgFunc for HilbertClusteringInfo { + type Args = HilbertClusteringInfoArgs; + + fn schema() -> TableSchemaRef { + HilbertClusteringInfoImpl::schema() + } + + async fn apply( + ctx: &Arc, + args: &Self::Args, + _plan: &DataSourcePlan, + ) -> Result { + let tenant_id = ctx.get_tenant(); + let tbl = ctx + .get_catalog(CATALOG_DEFAULT) + .await? 
+ .get_table( + &tenant_id, + args.database_name.as_str(), + args.table_name.as_str(), + ) + .await?; + + let tbl = FuseTable::try_from_table(tbl.as_ref())?; + + HilbertClusteringInfoImpl::new(ctx.clone(), tbl) + .get_clustering_info() + .await + } +} + +struct HilbertClusteringInfoImpl<'a> { + pub ctx: Arc, + pub table: &'a FuseTable, +} + +impl<'a> HilbertClusteringInfoImpl<'a> { + fn new(ctx: Arc, table: &'a FuseTable) -> Self { + Self { ctx, table } + } + + #[async_backtrace::framed] + async fn get_clustering_info(&self) -> Result { + let Some(cluster_key_str) = self.table.cluster_key_str() else { + return Err(ErrorCode::UnclusteredTable(format!( + "Unclustered table {}", + self.table.table_info.desc + ))); + }; + let cluster_type = self + .table + .get_option(OPT_KEY_CLUSTER_TYPE, ClusterType::Linear); + if matches!(cluster_type, ClusterType::Linear) { + return Err(ErrorCode::UnsupportedClusterType( + "Unsupported `linear` type, please use `clustering_information` instead", + )); + } + + let snapshot = self.table.read_table_snapshot().await?; + let now = Utc::now(); + let timestamp = snapshot + .as_ref() + .map_or(now, |s| s.timestamp.unwrap_or(now)) + .timestamp_micros(); + let mut total_segment_count = 0; + let mut stable_segment_count = 0; + let mut partial_segment_count = 0; + let mut unclustered_segment_count = 0; + if let Some(snapshot) = snapshot { + let total_count = snapshot.segments.len(); + total_segment_count = total_count as u64; + let chunk_size = std::cmp::min( + self.ctx.get_settings().get_max_threads()? as usize * 4, + total_count, + ) + .max(1); + let segments_io = SegmentsIO::create( + self.ctx.clone(), + self.table.operator.clone(), + self.table.schema(), + ); + for chunk in snapshot.segments.chunks(chunk_size) { + let segments = segments_io + .read_segments::>(chunk, true) + .await?; + for segment in segments { + let segment = segment?; + let Some(level) = segment.summary.cluster_stats.as_ref().map(|v| v.level) + else { + unclustered_segment_count += 1; + continue; + }; + if level == -1 { + stable_segment_count += 1; + } else { + partial_segment_count += 1; + } + } + } + } + Ok(DataBlock::new( + vec![ + BlockEntry::new( + DataType::String, + Value::Scalar(Scalar::String(cluster_key_str.to_string())), + ), + BlockEntry::new( + DataType::String, + Value::Scalar(Scalar::String("hilbert".to_string())), + ), + BlockEntry::new( + DataType::Timestamp, + Value::Scalar(Scalar::Timestamp(timestamp)), + ), + BlockEntry::new( + DataType::Number(NumberDataType::UInt64), + Value::Scalar(Scalar::Number(NumberScalar::UInt64(total_segment_count))), + ), + BlockEntry::new( + DataType::Number(NumberDataType::UInt64), + Value::Scalar(Scalar::Number(NumberScalar::UInt64(stable_segment_count))), + ), + BlockEntry::new( + DataType::Number(NumberDataType::UInt64), + Value::Scalar(Scalar::Number(NumberScalar::UInt64(partial_segment_count))), + ), + BlockEntry::new( + DataType::Number(NumberDataType::UInt64), + Value::Scalar(Scalar::Number(NumberScalar::UInt64( + unclustered_segment_count, + ))), + ), + ], + 1, + )) + } + + fn schema() -> Arc { + TableSchemaRefExt::create(vec![ + TableField::new("cluster_key", TableDataType::String), + TableField::new("type", TableDataType::String), + TableField::new("timestamp", TableDataType::Timestamp), + TableField::new( + "total_segment_count", + TableDataType::Number(NumberDataType::UInt64), + ), + TableField::new( + "stable_segment_count", + TableDataType::Number(NumberDataType::UInt64), + ), + TableField::new( + "partial_segment_count", + 
TableDataType::Number(NumberDataType::UInt64), + ), + TableField::new( + "unclustered_segment_count", + TableDataType::Number(NumberDataType::UInt64), + ), + ]) + } +} diff --git a/src/query/storages/fuse/src/table_functions/mod.rs b/src/query/storages/fuse/src/table_functions/mod.rs index b4bf4e61872d3..68967aaf7bec4 100644 --- a/src/query/storages/fuse/src/table_functions/mod.rs +++ b/src/query/storages/fuse/src/table_functions/mod.rs @@ -24,6 +24,7 @@ mod fuse_snapshot; mod fuse_statistic; mod fuse_time_travel_size; mod fuse_vacuum_temporary_table; +mod hilbert_clustering_information; mod table_args; mod set_cache_capacity; @@ -45,5 +46,6 @@ pub use fuse_statistic::FuseStatisticsFunc; pub use fuse_time_travel_size::FuseTimeTravelSize; pub use fuse_time_travel_size::FuseTimeTravelSizeFunc; pub use fuse_vacuum_temporary_table::FuseVacuumTemporaryTable; +pub use hilbert_clustering_information::HilbertClusteringInfoFunc; pub use set_cache_capacity::SetCacheCapacity; pub use table_args::*; diff --git a/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0000_recluster_final.test b/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0000_recluster_final.test new file mode 100644 index 0000000000000..01b2579043fb5 --- /dev/null +++ b/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0000_recluster_final.test @@ -0,0 +1,95 @@ +## Copyright 2023 Databend Cloud +## +## Licensed under the Elastic License, Version 2.0 (the "License"); +## you may not use this file except in compliance with the License. +## You may obtain a copy of the License at +## +## https://www.elastic.co/licensing/elastic-license +## +## Unless required by applicable law or agreed to in writing, software +## distributed under the License is distributed on an "AS IS" BASIS, +## WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +## See the License for the specific language governing permissions and +## limitations under the License. 
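
The `hilbert_clustering_information` table function defined above classifies each segment by the `level` stored in its cluster statistics: level -1 counts as stable (fully clustered), any other level counts as partial, and a segment without cluster statistics is reported as unclustered. A hedged sketch of that classification, using simplified types rather than the crate's actual ones:

enum SegmentState { Stable, Partial, Unclustered }

// `level` mirrors ClusterStatistics::level from the segment summary;
// None means the segment carries no cluster statistics at all.
fn classify(level: Option<i32>) -> SegmentState {
    match level {
        Some(-1) => SegmentState::Stable,
        Some(_) => SegmentState::Partial,
        None => SegmentState::Unclustered,
    }
}
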
+ +statement ok +CREATE OR REPLACE DATABASE test_hilbert + +statement ok +USE test_hilbert + +statement ok +set enable_parallel_multi_merge_sort = 0; + +statement ok +create or replace table t(a int, b int) cluster by hilbert(a, b) row_per_block=2 block_per_segment=2; + +statement ok +insert into t values(1, 1), (3, 3); + +statement ok +insert into t values(0, 0), (5, 5); + +statement ok +insert into t values(2, 2), (6, 6); + +statement ok +insert into t values(4, 4), (7, 7); + +query I +select count() from fuse_snapshot('test_hilbert','t'); +---- +4 + +statement error 4013 +select * EXCLUDE(timestamp) from clustering_information('test_hilbert','t'); + +query TTIIII +select * EXCLUDE(timestamp) from hilbert_clustering_information('test_hilbert','t'); +---- +(a, b) hilbert 4 0 0 4 + +statement ok +alter table t recluster final; + +query I +select count() from fuse_snapshot('test_hilbert','t'); +---- +6 + +query II +select count(a), sum(a) from t; +---- +8 28 + +statement ok +insert into t values(8, 8); + +statement ok +insert into t values(9, 9); + +statement ok +alter table t recluster final; + +query TTIIII +select * EXCLUDE(timestamp) from hilbert_clustering_information('test_hilbert','t'); +---- +(a, b) hilbert 3 2 1 0 + +query I +select count() from fuse_snapshot('test_hilbert','t'); +---- +9 + +query II +select block_count,row_count from fuse_segment('test_hilbert','t'); +---- +1 2 +2 4 +2 4 + +statement ok +drop table t all; + +statement ok +drop database test_hilbert; diff --git a/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0001_change_tracking.test b/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0001_change_tracking.test new file mode 100644 index 0000000000000..372ba402c9da1 --- /dev/null +++ b/tests/sqllogictests/suites/ee/07_hilbert_clustering/07_0001_change_tracking.test @@ -0,0 +1,56 @@ +## Copyright 2023 Databend Cloud +## +## Licensed under the Elastic License, Version 2.0 (the "License"); +## you may not use this file except in compliance with the License. +## You may obtain a copy of the License at +## +## https://www.elastic.co/licensing/elastic-license +## +## Unless required by applicable law or agreed to in writing, software +## distributed under the License is distributed on an "AS IS" BASIS, +## WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +## See the License for the specific language governing permissions and +## limitations under the License. 
+ +statement ok +CREATE OR REPLACE DATABASE test_hilbert_1 + +statement ok +USE test_hilbert_1 + +statement ok +create or replace table t(a int, b int) cluster by hilbert(a, b); + +statement ok +insert into t values(1, 1), (3, 3); + +statement ok +alter table t set options(change_tracking = true); + +statement ok +insert into t values(2, 2), (4, 4); + +query IIBBII +select a, b, _origin_version is null, _origin_block_id is null, _origin_block_row_num, _row_version from t order by a; +---- +1 1 1 1 NULL 0 +2 2 1 1 NULL 0 +3 3 1 1 NULL 0 +4 4 1 1 NULL 0 + +statement ok +alter table t recluster; + +query IIBBII +select a, b, _origin_version is null, _origin_block_id is null, _origin_block_row_num, _row_version from t order by a; +---- +1 1 0 0 0 0 +2 2 0 0 0 0 +3 3 0 0 1 0 +4 4 0 0 1 0 + +statement ok +drop table t all; + +statement ok +drop database test_hilbert_1; diff --git a/tests/sqllogictests/suites/mode/standalone/ee/explain_hilbert_clustering.test b/tests/sqllogictests/suites/mode/standalone/ee/explain_hilbert_clustering.test new file mode 100644 index 0000000000000..a2926ad814ead --- /dev/null +++ b/tests/sqllogictests/suites/mode/standalone/ee/explain_hilbert_clustering.test @@ -0,0 +1,70 @@ +## Copyright 2023 Databend Cloud +## +## Licensed under the Elastic License, Version 2.0 (the "License"); +## you may not use this file except in compliance with the License. +## You may obtain a copy of the License at +## +## https://www.elastic.co/licensing/elastic-license +## +## Unless required by applicable law or agreed to in writing, software +## distributed under the License is distributed on an "AS IS" BASIS, +## WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +## See the License for the specific language governing permissions and +## limitations under the License. 
+ +statement ok +set enable_parallel_multi_merge_sort = 0; + +statement ok +CREATE OR REPLACE TABLE test_hilbert(a int, b int) cluster by hilbert(a,b) row_per_block = 2; + +statement ok +INSERT INTO test_hilbert VALUES(1, 1), (1, 2); + +statement ok +INSERT INTO test_hilbert VALUES(2, 1), (2, 2); + +statement ok +ALTER TABLE test_hilbert RECLUSTER FINAL; + +statement error 4013 +select * from clustering_information('default','test_hilbert') + +query T +EXPLAIN SELECT * FROM test_hilbert WHERE a = 1; +---- +Filter +├── output columns: [test_hilbert.a (#0), test_hilbert.b (#1)] +├── filters: [is_true(test_hilbert.a (#0) = 1)] +├── estimated rows: 2.00 +└── TableScan + ├── table: default.default.test_hilbert + ├── output columns: [a (#0), b (#1)] + ├── read rows: 4 + ├── read size: < 1 KiB + ├── partitions total: 2 + ├── partitions scanned: 2 + ├── pruning stats: [segments: , blocks: ] + ├── push downs: [filters: [is_true(test_hilbert.a (#0) = 1)], limit: NONE] + └── estimated rows: 4.00 + +query T +EXPLAIN SELECT * FROM test_hilbert WHERE b = 1; +---- +Filter +├── output columns: [test_hilbert.a (#0), test_hilbert.b (#1)] +├── filters: [is_true(test_hilbert.b (#1) = 1)] +├── estimated rows: 2.00 +└── TableScan + ├── table: default.default.test_hilbert + ├── output columns: [a (#0), b (#1)] + ├── read rows: 2 + ├── read size: < 1 KiB + ├── partitions total: 2 + ├── partitions scanned: 1 + ├── pruning stats: [segments: , blocks: ] + ├── push downs: [filters: [is_true(test_hilbert.b (#1) = 1)], limit: NONE] + └── estimated rows: 4.00 + +statement ok +DROP TABLE test_hilbert ALL; diff --git a/tests/sqllogictests/suites/mode/standalone/explain/clustering.test b/tests/sqllogictests/suites/mode/standalone/explain/clustering.test index 0a20fe6dc65a4..12f8069645f34 100644 --- a/tests/sqllogictests/suites/mode/standalone/explain/clustering.test +++ b/tests/sqllogictests/suites/mode/standalone/explain/clustering.test @@ -54,61 +54,5 @@ Filter ├── push downs: [filters: [is_true(test_linear.b (#1) = 1)], limit: NONE] └── estimated rows: 4.00 -statement ok -CREATE OR REPLACE TABLE test_hilbert(a int, b int) cluster by hilbert(a,b) row_per_block = 2; - -statement ok -INSERT INTO test_hilbert VALUES(1, 1), (1, 2); - -statement ok -INSERT INTO test_hilbert VALUES(2, 1), (2, 2); - -statement ok -ALTER TABLE test_hilbert RECLUSTER FINAL; - -query TTIFFT -select cluster_key, type, total_block_count, average_overlaps, average_depth, block_depth_histogram from clustering_information('default','test_hilbert') ----- -(a, b) hilbert 2 0.0 1.0 {"00001":2} - -query T -EXPLAIN SELECT * FROM test_hilbert WHERE a = 1; ----- -Filter -├── output columns: [test_hilbert.a (#0), test_hilbert.b (#1)] -├── filters: [is_true(test_hilbert.a (#0) = 1)] -├── estimated rows: 2.00 -└── TableScan - ├── table: default.default.test_hilbert - ├── output columns: [a (#0), b (#1)] - ├── read rows: 4 - ├── read size: < 1 KiB - ├── partitions total: 2 - ├── partitions scanned: 2 - ├── pruning stats: [segments: , blocks: ] - ├── push downs: [filters: [is_true(test_hilbert.a (#0) = 1)], limit: NONE] - └── estimated rows: 4.00 - -query T -EXPLAIN SELECT * FROM test_hilbert WHERE b = 1; ----- -Filter -├── output columns: [test_hilbert.a (#0), test_hilbert.b (#1)] -├── filters: [is_true(test_hilbert.b (#1) = 1)] -├── estimated rows: 2.00 -└── TableScan - ├── table: default.default.test_hilbert - ├── output columns: [a (#0), b (#1)] - ├── read rows: 2 - ├── read size: < 1 KiB - ├── partitions total: 2 - ├── partitions scanned: 1 - ├── pruning 
stats: [segments: , blocks: ] - ├── push downs: [filters: [is_true(test_hilbert.b (#1) = 1)], limit: NONE] - └── estimated rows: 4.00 - statement ok DROP TABLE test_linear ALL; - -statement ok -DROP TABLE test_hilbert ALL; diff --git a/tests/suites/0_stateless/19_fuzz/19_0004_fuzz_filter.py b/tests/suites/0_stateless/19_fuzz/19_0004_fuzz_filter.py index eddbe3fc0f8ca..eba4fa1396a6b 100755 --- a/tests/suites/0_stateless/19_fuzz/19_0004_fuzz_filter.py +++ b/tests/suites/0_stateless/19_fuzz/19_0004_fuzz_filter.py @@ -23,4 +23,4 @@ for i in range(num_predicates): sql = f"explain analyze partial select * from t where a >= {int(step * i)};" - client1.run(sql) \ No newline at end of file + client1.run(sql)
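
For reference, the rule added to `write_segment` in transform_mutation_aggregator.rs marks a freshly written segment as stable (level -1) only when it holds at least `block_per_seg` blocks and also reaches the per-segment row or byte threshold; otherwise it is recorded as partial (level 0). A sketch of that decision as a standalone function (the real code computes this inline, so the signature here is an assumption):

// Decide the Hilbert cluster level for a newly written segment.
// `block_per_seg` comes from FUSE_OPT_KEY_BLOCK_PER_SEGMENT; the per-block
// thresholds come from the table's BlockThresholds.
fn hilbert_level(
    block_count: u64,
    row_count: u64,
    uncompressed_bytes: u64,
    block_per_seg: usize,
    min_rows_per_block: usize,
    max_bytes_per_block: usize,
) -> i32 {
    let full_blocks = block_count >= block_per_seg as u64;
    let full_rows = row_count as usize >= block_per_seg * min_rows_per_block;
    let full_bytes = uncompressed_bytes as usize >= block_per_seg * max_bytes_per_block;
    if full_blocks && (full_rows || full_bytes) {
        -1 // stable: the segment is considered fully clustered
    } else {
        0 // partial: eligible to be picked up by a later recluster
    }
}

This is consistent with the expectations in 07_0000_recluster_final.test: with `block_per_segment = 2` and `row_per_block = 2`, the two reclustered segments holding two blocks (four rows) each are reported as stable, while the single-block leftover segment is counted as partial.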