Commit 2c3fe5f

lint
1 parent ecb5d92 commit 2c3fe5f

File tree

2 files changed: +71 −58 lines changed


datafusion/physical-plan/src/repartition/mod.rs

Lines changed: 70 additions & 58 deletions
```diff
@@ -1248,37 +1248,40 @@ impl Stream for RepartitionStream {
             RepartitionStreamState::ReceivingFromChannel => {
                 let value = futures::ready!(self.input.recv().poll_unpin(cx));
                 match value {
-                    Some(Some(v)) => match v {
-                        Ok(RepartitionBatch::Memory(batch)) => {
-                            // Release memory and return
-                            self.reservation
-                                .lock()
-                                .shrink(batch.get_array_memory_size());
-                            return Poll::Ready(Some(Ok(batch)));
-                        }
-                        Ok(RepartitionBatch::Spilled) => {
-                            // Get next file from SpillPool and create a stream
-                            let next_file = self.spill_pool.lock().take_next_file()?;
-                            match next_file {
-                                Some(spill_file) => {
-                                    // Create stream using SpillReaderStream + spawn_buffered
-                                    let stream = self
-                                        .spill_manager
-                                        .read_spill_as_stream(spill_file, None)?;
-                                    self.state =
+                    Some(Some(v)) => {
+                        match v {
+                            Ok(RepartitionBatch::Memory(batch)) => {
+                                // Release memory and return
+                                self.reservation
+                                    .lock()
+                                    .shrink(batch.get_array_memory_size());
+                                return Poll::Ready(Some(Ok(batch)));
+                            }
+                            Ok(RepartitionBatch::Spilled) => {
+                                // Get next file from SpillPool and create a stream
+                                let next_file =
+                                    self.spill_pool.lock().take_next_file()?;
+                                match next_file {
+                                    Some(spill_file) => {
+                                        // Create stream using SpillReaderStream + spawn_buffered
+                                        let stream = self
+                                            .spill_manager
+                                            .read_spill_as_stream(spill_file, None)?;
+                                        self.state =
                                             RepartitionStreamState::ReadingSpilledBatch(stream);
-                                    continue;
-                                }
-                                None => {
-                                    // No spilled files available, continue receiving from channel
-                                    continue;
+                                        continue;
+                                    }
+                                    None => {
+                                        // No spilled files available, continue receiving from channel
+                                        continue;
+                                    }
                                 }
                             }
+                            Err(e) => {
+                                return Poll::Ready(Some(Err(e)));
+                            }
                         }
-                        Err(e) => {
-                            return Poll::Ready(Some(Err(e)));
-                        }
-                    },
+                    }
                     Some(None) => {
                         self.num_input_partitions_processed += 1;

@@ -1317,12 +1320,15 @@ impl Stream for RepartitionStream {
                             .spill_manager
                             .read_spill_as_stream(spill_file, None)?;
                         self.state =
-                            RepartitionStreamState::ReadingSpilledBatch(new_stream);
+                            RepartitionStreamState::ReadingSpilledBatch(
+                                new_stream,
+                            );
                         continue;
                     }
                     None => {
                         // No more spilled files, go back to receiving from channel
-                        self.state = RepartitionStreamState::ReceivingFromChannel;
+                        self.state =
+                            RepartitionStreamState::ReceivingFromChannel;
                         continue;
                     }
                 }

@@ -1378,37 +1384,40 @@ impl Stream for PerPartitionStream {
             RepartitionStreamState::ReceivingFromChannel => {
                 let value = futures::ready!(self.receiver.recv().poll_unpin(cx));
                 match value {
-                    Some(Some(v)) => match v {
-                        Ok(RepartitionBatch::Memory(batch)) => {
-                            // Release memory and return
-                            self.reservation
-                                .lock()
-                                .shrink(batch.get_array_memory_size());
-                            return Poll::Ready(Some(Ok(batch)));
-                        }
-                        Ok(RepartitionBatch::Spilled) => {
-                            // Get next file from SpillPool and create a stream
-                            let next_file = self.spill_pool.lock().take_next_file()?;
-                            match next_file {
-                                Some(spill_file) => {
-                                    // Create stream using SpillReaderStream + spawn_buffered
-                                    let stream = self
-                                        .spill_manager
-                                        .read_spill_as_stream(spill_file, None)?;
-                                    self.state =
+                    Some(Some(v)) => {
+                        match v {
+                            Ok(RepartitionBatch::Memory(batch)) => {
+                                // Release memory and return
+                                self.reservation
+                                    .lock()
+                                    .shrink(batch.get_array_memory_size());
+                                return Poll::Ready(Some(Ok(batch)));
+                            }
+                            Ok(RepartitionBatch::Spilled) => {
+                                // Get next file from SpillPool and create a stream
+                                let next_file =
+                                    self.spill_pool.lock().take_next_file()?;
+                                match next_file {
+                                    Some(spill_file) => {
+                                        // Create stream using SpillReaderStream + spawn_buffered
+                                        let stream = self
+                                            .spill_manager
+                                            .read_spill_as_stream(spill_file, None)?;
+                                        self.state =
                                             RepartitionStreamState::ReadingSpilledBatch(stream);
-                                    continue;
-                                }
-                                None => {
-                                    // No spilled files available, continue receiving from channel
-                                    continue;
+                                        continue;
+                                    }
+                                    None => {
+                                        // No spilled files available, continue receiving from channel
+                                        continue;
+                                    }
                                 }
                             }
+                            Err(e) => {
+                                return Poll::Ready(Some(Err(e)));
+                            }
                         }
-                        Err(e) => {
-                            return Poll::Ready(Some(Err(e)));
-                        }
-                    },
+                    }
                     Some(None) => {
                         // Input partition has finished sending batches
                         return Poll::Ready(None);

@@ -1436,12 +1445,15 @@ impl Stream for PerPartitionStream {
                             .spill_manager
                             .read_spill_as_stream(spill_file, None)?;
                         self.state =
-                            RepartitionStreamState::ReadingSpilledBatch(new_stream);
+                            RepartitionStreamState::ReadingSpilledBatch(
+                                new_stream,
+                            );
                         continue;
                     }
                     None => {
                         // No more spilled files, go back to receiving from channel
-                        self.state = RepartitionStreamState::ReceivingFromChannel;
+                        self.state =
+                            RepartitionStreamState::ReceivingFromChannel;
                         continue;
                     }
                 }
```
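For orientation, the sketch below summarizes the two-state machine these hunks reformat (the lint commit changes layout only, not behavior). The variant names and the spill-reading flow are read off the diff itself; the payload type and everything else here is an assumption, not the actual definition in `repartition/mod.rs`.

```rust
use datafusion::physical_plan::SendableRecordBatchStream;

// Hypothetical reconstruction of the state machine driven by the poll
// loops above; only the names visible in the diff are taken from the source.
#[allow(dead_code)]
enum RepartitionStreamState {
    // Poll the channel: a RepartitionBatch::Memory(batch) is returned
    // directly (after shrinking the memory reservation), while a
    // RepartitionBatch::Spilled marker asks the SpillPool for the next
    // file and switches to ReadingSpilledBatch.
    ReceivingFromChannel,
    // Drain record batches from one spill file (opened via
    // SpillManager::read_spill_as_stream); when it is exhausted, move to
    // the next spill file or fall back to ReceivingFromChannel.
    ReadingSpilledBatch(SendableRecordBatchStream),
}
```

Both `RepartitionStream` and `PerPartitionStream` run the same loop; the only behavioral difference visible in this diff is the `Some(None)` (channel closed) arm, where the former counts finished input partitions and the latter ends the stream.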

docs/source/user-guide/configs.md

Lines changed: 1 addition & 0 deletions
```diff
@@ -114,6 +114,7 @@ The following configuration settings are available:
 | datafusion.execution.spill_compression | uncompressed | Sets the compression codec used when spilling data to disk. Since datafusion writes spill files using the Arrow IPC Stream format, only codecs supported by the Arrow IPC Stream Writer are allowed. Valid values are: uncompressed, lz4_frame, zstd. Note: lz4_frame offers faster (de)compression, but typically results in larger spill files. In contrast, zstd achieves higher compression ratios at the cost of slower (de)compression speed. |
 | datafusion.execution.sort_spill_reservation_bytes | 10485760 | Specifies the reserved memory for each spillable sort operation to facilitate an in-memory merge. When a sort operation spills to disk, the in-memory data must be sorted and merged before being written to a file. This setting reserves a specific amount of memory for that in-memory sort/merge process. Note: This setting is irrelevant if the sort operation cannot spill (i.e., if there's no `DiskManager` configured). |
 | datafusion.execution.sort_in_place_threshold_bytes | 1048576 | When sorting, below what size should data be concatenated and sorted in a single RecordBatch rather than sorted in batches and merged. |
+| datafusion.execution.max_spill_file_size_bytes | 104857600 | Maximum size in bytes for individual spill files before rotating to a new file. When operators spill data to disk (e.g., RepartitionExec, SortExec), they write multiple batches to the same file until this size limit is reached, then rotate to a new file. This reduces syscall overhead compared to one-file-per-batch while preventing files from growing too large. A larger value reduces file creation overhead but may hold more disk space. A smaller value creates more files but allows finer-grained space reclamation (especially in LIFO mode where files are truncated after reading). Default: 100 MB |
 | datafusion.execution.meta_fetch_concurrency | 32 | Number of files to read in parallel when inferring schema and statistics |
 | datafusion.execution.minimum_parallel_output_files | 4 | Guarantees a minimum level of output files running in parallel. RecordBatches will be distributed in round robin fashion to each parallel writer. Each writer is closed and a new file opened once soft_max_rows_per_output_file is reached. |
 | datafusion.execution.soft_max_rows_per_output_file | 50000000 | Target number of rows in output files when writing multiple. This is a soft max, so it can be exceeded slightly. There also will be one file smaller than the limit if the total number of rows written is not roughly divisible by the soft max |
```
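As a usage note, the new `datafusion.execution.max_spill_file_size_bytes` key should be settable like any other execution option once this commit lands. The snippet below is a sketch, not part of the commit; it takes the key from the table above and assumes `SessionConfig::set_u64`, one of DataFusion's typed config setters.

```rust
use datafusion::prelude::{SessionConfig, SessionContext};

fn main() {
    // Sketch: rotate spill files at 64 MB instead of the 100 MB default.
    // The key comes from the docs table above; set_u64 is assumed to be
    // one of SessionConfig's typed setters.
    let config = SessionConfig::new().set_u64(
        "datafusion.execution.max_spill_file_size_bytes",
        64 * 1024 * 1024,
    );
    let ctx = SessionContext::new_with_config(config);
    // ... register tables and run queries on `ctx` as usual ...
    drop(ctx);
}
```

The same override should also work from SQL, e.g. `SET datafusion.execution.max_spill_file_size_bytes = 67108864;`.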
