Commit ce16f72

fix test

1 parent 8a4cdce · commit ce16f72

15 files changed (+88 / -84 lines)

src/query/expression/src/utils/block_thresholds.rs (4 additions, 4 deletions)

@@ -39,7 +39,7 @@ impl Default for BlockThresholds {
             max_bytes_per_block: DEFAULT_BLOCK_BUFFER_SIZE * 2,
             min_bytes_per_block: (DEFAULT_BLOCK_BUFFER_SIZE * 4).div_ceil(5),
             max_compressed_per_block: DEFAULT_BLOCK_COMPRESSED_SIZE,
-            min_compressed_per_block: (DEFAULT_BLOCK_COMPRESSED_SIZE * 4).div_ceil(5),
+            min_compressed_per_block: (DEFAULT_BLOCK_COMPRESSED_SIZE * 3).div_ceil(5),
             block_per_segment: DEFAULT_BLOCK_PER_SEGMENT,
         }
     }
@@ -58,7 +58,7 @@ impl BlockThresholds {
             max_bytes_per_block: bytes_per_block * 2,
             min_bytes_per_block: (bytes_per_block * 4).div_ceil(5),
             max_compressed_per_block,
-            min_compressed_per_block: (max_compressed_per_block * 4).div_ceil(5),
+            min_compressed_per_block: (max_compressed_per_block * 3).div_ceil(5),
             block_per_segment,
         }
     }
@@ -153,7 +153,7 @@ impl BlockThresholds {
         let bytes_per_block = total_bytes.div_ceil(block_num_by_compressed);
         // Adjust the number of blocks based on block size thresholds.
         let max_bytes_per_block = self.max_bytes_per_block.min(400 * 1024 * 1024);
-        let min_bytes_per_block = (self.min_bytes_per_block / 2).min(50 * 1024 * 1024);
+        let min_bytes_per_block = self.min_bytes_per_block.min(100 * 1024 * 1024);
         let block_nums = if bytes_per_block > max_bytes_per_block {
             // Case 1: If the block size is too bigger.
             total_bytes.div_ceil(max_bytes_per_block)
@@ -201,7 +201,7 @@ impl BlockThresholds {
         // Adjust block count based on byte size thresholds.
         let bytes_per_block = total_bytes.div_ceil(by_compressed);
         let max_bytes = self.max_bytes_per_block.min(400 * 1024 * 1024);
-        let min_bytes = (self.min_bytes_per_block / 2).min(50 * 1024 * 1024);
+        let min_bytes = self.min_bytes_per_block.min(100 * 1024 * 1024);
         let total_partitions = if bytes_per_block > max_bytes {
             // Block size is too large.
             total_bytes / max_bytes
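Taken together, these hunks relax the compressed-size floor from 4/5 to 3/5 of the maximum, and stop halving the byte floor during recluster sizing while raising its cap from 50 MiB to 100 MiB. A minimal sketch of the revised arithmetic, using hypothetical placeholder values since the real DEFAULT_* constants are defined elsewhere in the source:

```rust
// Sketch of the new threshold arithmetic. The constant values below are
// hypothetical placeholders, not the real DEFAULT_* constants.
fn main() {
    let default_block_buffer_size: usize = 16 * 1024 * 1024; // hypothetical
    let default_block_compressed_size: usize = 8 * 1024 * 1024; // hypothetical

    // Unchanged: the byte floor stays at 4/5 of the buffer size.
    let min_bytes_per_block = (default_block_buffer_size * 4).div_ceil(5);
    // Changed: the compressed floor drops from 4/5 to 3/5 of the maximum.
    let min_compressed_per_block = (default_block_compressed_size * 3).div_ceil(5);

    // Changed: recluster sizing now clamps against the full byte floor with a
    // 100 MiB cap, instead of half the floor capped at 50 MiB.
    let min_bytes = min_bytes_per_block.min(100 * 1024 * 1024);

    println!("{min_bytes_per_block} {min_compressed_per_block} {min_bytes}");
}
```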

src/query/expression/tests/it/block_thresholds.rs (3 additions, 3 deletions)

@@ -105,8 +105,8 @@ fn test_calc_rows_for_recluster() {
     assert_eq!(result, 300);

     // Case 2: If the block size is too smaller.
-    let result = t.calc_rows_for_recluster(4_000, 2_000_000, 600_000);
-    assert_eq!(result, 800);
+    let result = t.calc_rows_for_recluster(4_000, 1_600_000, 600_000);
+    assert_eq!(result, 2000);

     // Case 3: use the compressed-based block count.
     let result = t.calc_rows_for_recluster(4_000, 10_000_000, 600_000);
@@ -131,7 +131,7 @@ fn test_calc_partitions_for_recluster() {
     assert_eq!(result, 15);

     // Case 2: If the block size is too smaller.
-    let result = t.calc_partitions_for_recluster(4_000, 800_000, 800_000);
+    let result = t.calc_partitions_for_recluster(4_000, 1_600_000, 800_000);
     assert_eq!(result, 2);

     // Case 3: use the compressed-based block count.

src/query/service/src/interpreters/interpreter_table_recluster.rs (1 addition, 1 deletion)

@@ -631,7 +631,7 @@ impl ReclusterTableInterpreter {
         let database = &self.plan.database;
         let table = &self.plan.table;
         let settings = self.ctx.get_settings();
-        let sample_size = settings.get_hilbert_sample_size_per_block()?;
+        let sample_size = settings.get_recluster_sample_size_per_block()?;

         let name_resolution_ctx = NameResolutionContext::try_from(settings.as_ref())?;
         let ast_exprs = tbl.resolve_cluster_keys(self.ctx.clone()).unwrap();

src/query/service/src/pipelines/builders/builder_recluster.rs (10 additions, 6 deletions)

@@ -187,15 +187,19 @@ impl PipelineBuilder {
             .collect();

         let num_processors = self.main_pipeline.output_len();
-        let sample_rate = 0.01;
+        let sample_size = self
+            .ctx
+            .get_settings()
+            .get_recluster_sample_size_per_block()?
+            as usize;
         let partitions = block_thresholds.calc_partitions_for_recluster(
             task.total_rows,
             task.total_bytes,
             task.total_compressed,
         );
         let state = SampleState::new(num_processors, partitions);
         let recluster_pipeline_builder =
-            ReclusterPipelineBuilder::create(schema, sort_descs.into(), sample_rate)
+            ReclusterPipelineBuilder::create(schema, sort_descs.into(), sample_size)
                 .with_state(state);
         recluster_pipeline_builder
             .build_recluster_sample_pipeline(&mut self.main_pipeline)?;
@@ -314,21 +318,21 @@ struct ReclusterPipelineBuilder {
     schema: DataSchemaRef,
     sort_desc: Arc<[SortColumnDescription]>,
     state: Option<Arc<SampleState>>,
-    sample_rate: f64,
+    sample_size: usize,
     seed: u64,
 }

 impl ReclusterPipelineBuilder {
     fn create(
         schema: DataSchemaRef,
         sort_desc: Arc<[SortColumnDescription]>,
-        sample_rate: f64,
+        sample_size: usize,
     ) -> Self {
         Self {
             schema,
             sort_desc,
             state: None,
-            sample_rate,
+            sample_size,
             seed: rand::random(),
         }
     }
@@ -382,7 +386,7 @@ impl ReclusterPipelineBuilder {
         })?;
         let offset = self.schema.num_fields();
         pipeline.add_accumulating_transformer(|| {
-            TransformReclusterCollect::<R::Type>::new(offset, self.sample_rate, self.seed)
+            TransformReclusterCollect::<R::Type>::new(offset, self.sample_size, self.seed)
         });
         pipeline.add_transform(|input, output| {
             Ok(ProcessorPtr::create(TransformRangePartitionIndexer::<

src/query/service/src/pipelines/processors/transforms/recluster/range_bound_sampler.rs (6 additions, 11 deletions)

@@ -26,7 +26,7 @@ pub struct RangeBoundSampler<T>
 where T: ValueType
 {
     offset: usize,
-    sample_rate: f64,
+    sample_size: usize,
     rng: SmallRng,

     values: Vec<(u64, Vec<Scalar>)>,
@@ -36,11 +36,11 @@ where T: ValueType
 impl<T> RangeBoundSampler<T>
 where T: ValueType
 {
-    pub fn new(offset: usize, sample_rate: f64, seed: u64) -> Self {
+    pub fn new(offset: usize, sample_size: usize, seed: u64) -> Self {
         let rng = SmallRng::seed_from_u64(seed);
         Self {
             offset,
-            sample_rate,
+            sample_size,
             rng,
             values: vec![],
             _t: PhantomData,
@@ -58,15 +58,10 @@ where
         assert!(rows > 0);
         let column = data.get_by_offset(self.offset).to_column(rows);

-        let sample_size = std::cmp::max((self.sample_rate * rows as f64).ceil() as usize, 100);
+        let sample_size = std::cmp::min(self.sample_size, rows);
         let mut indices = (0..rows).collect::<Vec<_>>();
-
-        let sampled_indices = if rows > sample_size {
-            indices.shuffle(&mut self.rng);
-            &indices[..sample_size]
-        } else {
-            &indices
-        };
+        indices.shuffle(&mut self.rng);
+        let sampled_indices = &indices[..sample_size];

         let column = T::try_downcast_column(&column).unwrap();
         let sample_values = sampled_indices
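The sampler now draws a fixed number of rows per block instead of a 1% rate with a floor of 100. A self-contained sketch of the new selection logic, assuming only the `rand` crate (with its `small_rng` feature) as a dependency:

```rust
use rand::rngs::SmallRng;
use rand::seq::SliceRandom;
use rand::SeedableRng;

/// Shuffle all row indices and keep the first `sample_size`, clamped to the
/// row count: a fixed-size sample without replacement, deterministic for a
/// given seed, mirroring the new RangeBoundSampler behavior.
fn sample_rows(rows: usize, sample_size: usize, seed: u64) -> Vec<usize> {
    let mut rng = SmallRng::seed_from_u64(seed);
    let sample_size = sample_size.min(rows);
    let mut indices: Vec<usize> = (0..rows).collect();
    indices.shuffle(&mut rng);
    indices[..sample_size].to_vec()
}

fn main() {
    // With fewer rows than the requested sample, every row is selected.
    assert_eq!(sample_rows(3, 1000, 42).len(), 3);
    // Otherwise exactly `sample_size` distinct indices come back.
    assert_eq!(sample_rows(10_000, 1000, 42).len(), 1000);
}
```

Clamping to `rows` also removes the old branch on `rows > sample_size`: the slice `&indices[..sample_size]` is always in bounds.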

src/query/service/src/pipelines/processors/transforms/recluster/recluster_partition_strategy.rs (33 additions, 7 deletions)

@@ -32,6 +32,10 @@ impl ReclusterPartitionStrategy {
     pub fn new(properties: Arc<StreamBlockProperties>) -> Self {
         Self { properties }
     }
+
+    fn concat_blocks(blocks: Vec<DataBlock>) -> Result<DataBlock> {
+        DataBlock::concat(&blocks)
+    }
 }

 impl PartitionProcessStrategy for ReclusterPartitionStrategy {
@@ -51,22 +55,44 @@ impl PartitionProcessStrategy for ReclusterPartitionStrategy {
     /// Stream write each block, and flush it conditionally based on builder status
     /// and input size estimation.
     fn process_data_blocks(&self, data_blocks: Vec<DataBlock>) -> Result<Vec<DataBlock>> {
-        let mut input_sizes: usize = data_blocks.iter().map(|b| b.estimate_block_size()).sum();
-        let mut input_rows: usize = data_blocks.iter().map(|b| b.num_rows()).sum();
+        let blocks_num = data_blocks.len();
+        let mut accumulated_rows = 0;
+        let mut accumulated_bytes = 0;
+        let mut pending_blocks = Vec::with_capacity(blocks_num);
+        let mut staged_blocks = Vec::with_capacity(blocks_num);
+        let mut compacted = Vec::with_capacity(blocks_num);
+        for block in data_blocks {
+            accumulated_rows += block.num_rows();
+            accumulated_bytes += block.estimate_block_size();
+            pending_blocks.push(block);
+            if !self
+                .properties
+                .check_large_enough(accumulated_rows, accumulated_bytes)
+            {
+                continue;
+            }
+            if !staged_blocks.is_empty() {
+                compacted.push(Self::concat_blocks(std::mem::take(&mut staged_blocks))?);
+            }
+            std::mem::swap(&mut staged_blocks, &mut pending_blocks);
+            accumulated_rows = 0;
+            accumulated_bytes = 0;
+        }
+        staged_blocks.append(&mut pending_blocks);
+        if !staged_blocks.is_empty() {
+            compacted.push(Self::concat_blocks(std::mem::take(&mut staged_blocks))?);
+        }

         let mut result = Vec::new();
         let mut builder = StreamBlockBuilder::try_new_with_config(self.properties.clone())?;
-        for block in data_blocks {
-            input_sizes -= block.estimate_block_size();
-            input_rows -= block.num_rows();
+        for block in compacted {
             builder.write(block)?;
-            if builder.need_flush() && self.properties.check_large_enough(input_rows, input_sizes) {
+            if builder.need_flush() {
                 let serialized = builder.finish()?;
                 result.push(DataBlock::empty_with_meta(Box::new(serialized)));
                 builder = StreamBlockBuilder::try_new_with_config(self.properties.clone())?;
             }
         }
-
         if !builder.is_empty() {
             let serialized = builder.finish()?;
             result.push(DataBlock::empty_with_meta(Box::new(serialized)));
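The rewritten `process_data_blocks` now compacts undersized inputs before anything reaches the stream builder: blocks accumulate in `pending_blocks` until `check_large_enough` passes, the previously staged batch is flushed, and the new batch is held back so any undersized tail can be merged into it. A simplified sketch of that staging pattern, with a plain size predicate standing in for `check_large_enough` and a row/byte-count struct standing in for `DataBlock`:

```rust
/// Stand-in for DataBlock carrying just the sizes the staging logic needs.
struct Block {
    rows: usize,
    bytes: usize,
}

/// Group blocks into batches that each satisfy the size predicate, holding
/// the last qualifying batch back so an undersized tail merges into it
/// rather than becoming a tiny trailing output.
fn compact(blocks: Vec<Block>, min_rows: usize, min_bytes: usize) -> Vec<Vec<Block>> {
    let mut pending: Vec<Block> = Vec::new(); // accumulating toward the threshold
    let mut staged: Vec<Block> = Vec::new(); // last batch that crossed it
    let mut out = Vec::new();
    let (mut rows, mut bytes) = (0, 0);
    for b in blocks {
        rows += b.rows;
        bytes += b.bytes;
        pending.push(b);
        // Assumed semantics of check_large_enough: "large enough" once either
        // the row count or the byte count reaches its floor.
        if rows < min_rows && bytes < min_bytes {
            continue;
        }
        if !staged.is_empty() {
            out.push(std::mem::take(&mut staged)); // flush the previous batch
        }
        std::mem::swap(&mut staged, &mut pending); // hold this batch back
        rows = 0;
        bytes = 0;
    }
    // Merge any undersized remainder into the held-back batch.
    staged.append(&mut pending);
    if !staged.is_empty() {
        out.push(staged);
    }
    out
}
```

With pre-compaction in place, the builder loop no longer needs the old `check_large_enough(input_rows, input_sizes)` guard: every block it writes already meets the size floor, so `need_flush` alone decides when to cut a block.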

src/query/service/src/pipelines/processors/transforms/recluster/transform_recluster_collect.rs (2 additions, 2 deletions)

@@ -36,10 +36,10 @@ where
     T: ArgType + Send + Sync,
     T::Scalar: Ord + Send,
 {
-    pub fn new(offset: usize, sample_rate: f64, seed: u64) -> Self {
+    pub fn new(offset: usize, sample_size: usize, seed: u64) -> Self {
         Self {
             input_data: vec![],
-            sampler: RangeBoundSampler::<T>::new(offset, sample_rate, seed),
+            sampler: RangeBoundSampler::<T>::new(offset, sample_size, seed),
         }
     }
 }

src/query/settings/src/settings_default.rs (4 additions, 4 deletions)

@@ -755,7 +755,7 @@ impl DefaultSettings {
             range: Some(SettingRange::Numeric(0..=1)),
         }),
         ("enable_distributed_compact", DefaultSettingValue {
-            value: UserSettingValue::UInt64(0),
+            value: UserSettingValue::UInt64(1),
             desc: "Enables distributed execution of table compaction.",
             mode: SettingMode::Both,
             scope: SettingScope::Both,
@@ -870,7 +870,7 @@ impl DefaultSettings {
             range: Some(SettingRange::Numeric(2..=u64::MAX)),
         }),
         ("enable_distributed_recluster", DefaultSettingValue {
-            value: UserSettingValue::UInt64(0),
+            value: UserSettingValue::UInt64(1),
             desc: "Enable distributed execution of table recluster.",
             mode: SettingMode::Both,
             scope: SettingScope::Both,
@@ -1220,9 +1220,9 @@ impl DefaultSettings {
             scope: SettingScope::Both,
             range: Some(SettingRange::Numeric(1..=65535)),
         }),
-        ("hilbert_sample_size_per_block", DefaultSettingValue {
+        ("recluster_sample_size_per_block", DefaultSettingValue {
             value: UserSettingValue::UInt64(1000),
-            desc: "Specifies the number of sample points per block used in Hilbert clustering.",
+            desc: "Specifies the number of sample points per block used in clustering.",
             mode: SettingMode::Both,
             scope: SettingScope::Both,
             range: Some(SettingRange::Numeric(1..=u64::MAX)),

src/query/settings/src/settings_getter_setter.rs (2 additions, 2 deletions)

@@ -889,8 +889,8 @@ impl Settings {
         self.try_get_u64("hilbert_num_range_ids")
     }

-    pub fn get_hilbert_sample_size_per_block(&self) -> Result<u64> {
-        self.try_get_u64("hilbert_sample_size_per_block")
+    pub fn get_recluster_sample_size_per_block(&self) -> Result<u64> {
+        self.try_get_u64("recluster_sample_size_per_block")
     }

     pub fn get_hilbert_clustering_min_bytes(&self) -> Result<u64> {

src/query/storages/fuse/src/io/write/stream/block_builder.rs (2 additions, 2 deletions)

@@ -238,9 +238,9 @@ impl StreamBlockBuilder {
     pub fn need_flush(&self) -> bool {
         let file_size = self.block_writer.compressed_size();
         self.row_count >= self.properties.block_thresholds.min_rows_per_block
-            || self.block_size >= self.properties.block_thresholds.max_bytes_per_block
+            || self.block_size >= self.properties.block_thresholds.min_bytes_per_block * 2
             || (file_size >= self.properties.block_thresholds.min_compressed_per_block
-                && self.block_size >= self.properties.block_thresholds.min_bytes_per_block / 2)
+                && self.block_size >= self.properties.block_thresholds.min_bytes_per_block)
     }

     pub fn write(&mut self, block: DataBlock) -> Result<()> {
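The flush trigger now keys off `min_bytes_per_block` in both byte-size branches: flush at twice the byte floor regardless of compression, or at the floor itself once the compressed size also clears its floor. A minimal sketch of the revised predicate, with the builder state and thresholds passed in explicitly for illustration rather than read from `StreamBlockProperties`:

```rust
/// Revised flush predicate from StreamBlockBuilder::need_flush, rewritten as
/// a free function over explicit arguments for illustration.
fn need_flush(
    row_count: usize,
    block_size: usize, // in-memory (uncompressed) size so far
    file_size: usize,  // compressed size written so far
    min_rows_per_block: usize,
    min_bytes_per_block: usize,
    min_compressed_per_block: usize,
) -> bool {
    row_count >= min_rows_per_block
        || block_size >= min_bytes_per_block * 2
        || (file_size >= min_compressed_per_block && block_size >= min_bytes_per_block)
}

fn main() {
    // Below every threshold: keep writing.
    assert!(!need_flush(10, 1_000, 100, 1_000_000, 1_000_000, 500_000));
    // Twice the byte floor forces a flush even if compression lags.
    assert!(need_flush(10, 2_000_000, 100, 1_000_000, 1_000_000, 500_000));
    // Compressed floor plus the byte floor also flushes.
    assert!(need_flush(10, 1_000_000, 500_000, 1_000_000, 1_000_000, 500_000));
}
```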
