Sort: improve the code after recent changes #10647

xtqqczze · 2026-02-02T21:54:33Z

Suggested change

for (idx, selector) in settings.selectors.iter().enumerate() {

for (key_index, selector) in (1..).zip(settings.selectors.iter()) {

xtqqczze · 2026-02-02T21:35:37Z

enumerate() itself doesn’t guard against overflow, so guarding only at idx + 1 doesn’t add real safety.

In any case, I think idx.checked_add(1).unwrap() would make more sense.

Hang on, there is no potential overflow: key_index has the range 1..=settings.selectors.len()

They all optimise to the same anyway: https://godbolt.org/z/f4WzhP1vf

-Original file line number
+Diff line change
@@ Expand Up / @@ -243,3 +243,7 @@ Hijri @@
     Nowruz
     charmap
     hijri
+    TERA
+    GIGA
+    PETA

-Original file line number
+Diff line change
@@ Expand Up / @@ -9,6 +9,8 @@ use std::ffi::OsString; @@
     use crate::{
         FALLBACK_AUTOMATIC_BUF_SIZE, MAX_AUTOMATIC_BUF_SIZE, MIN_AUTOMATIC_BUF_SIZE, STDIN_FILE,
     };
+    #[cfg(test)]
+    use uucore::parser::parse_size::MEGA;
     // Heuristics to size the external sort buffer without overcommitting memory.
     pub(crate) fn automatic_buffer_size(files: &[OsString]) -> usize {
@@ Expand Down Expand Up / @@ -135,15 +137,15 @@ mod tests { @@
         #[test]
         fn desired_buffer_matches_total_when_small() {
-            let six_mebibytes = 6 * 1024 * 1024;
+            let six_mebibytes = 6 * MEGA;
             let expected = ((six_mebibytes as u128) * 12)
                 .clamp(six_mebibytes as u128, crate::MAX_AUTOMATIC_BUF_SIZE as u128);
             assert_eq!(desired_file_buffer_bytes(six_mebibytes as u128), expected);
         }
         #[test]
         fn desired_buffer_caps_at_max_for_large_inputs() {
-            let large = 256 * 1024 * 1024; // 256 MiB
+            let large = 256 * MEGA; // 256 MiB
             assert_eq!(
                 desired_file_buffer_bytes(large as u128),
                 crate::MAX_AUTOMATIC_BUF_SIZE as u128
@@ Expand Down @@

-Original file line number
+Diff line change
@@ Expand Up / @@ -22,8 +22,9 @@ use uucore::error::{UResult, USimpleError}; @@
     use crate::{
         GeneralBigDecimalParseResult, GlobalSettings, Line, SortMode, numeric_str_cmp::NumInfo,
     };
+    use uucore::parser::parse_size::MEGA;
-    const MAX_TOKEN_BUFFER_BYTES: usize = 4 * 1024 * 1024;
+    const MAX_TOKEN_BUFFER_BYTES: usize = 4 * MEGA;
     const MAX_TOKEN_BUFFER_ELEMS: usize = MAX_TOKEN_BUFFER_BYTES / std::mem::size_of::<Range<usize>>();
     self_cell!(
@@ Expand Down Expand Up / @@ -374,7 +375,7 @@ fn read_to_buffer<T: Read>( @@
                         // We need to read more lines
                         let len = buffer.len();
-                        let grow_by = (len / 2).max(1024 * 1024);
+                        let grow_by = (len / 2).max(MEGA);
                         buffer.resize(len + grow_by, 0);
                         read_target = &mut buffer[len..];
                     } else {
@@ Expand Down @@

-Original file line number
+Diff line change
@@ Expand Up / @@ -35,6 +35,7 @@ use crate::{ @@
         compare_by, merge, sort_by,
     };
     use crate::{Line, print_sorted};
+    use uucore::parser::parse_size::MEGA;
     // Note: update `test_sort::test_start_buffer` if this size is changed
     const START_BUFFER_SIZE: usize = 8_000;
@@ Expand Down Expand Up / @@ -116,11 +117,11 @@ fn reader_writer< @@
         // Cap oversized buffer requests to avoid unnecessary allocations and give the automatic
         // heuristic room to grow when the user does not provide an explicit value.
         let mut buffer_size = match settings.buffer_size {
-            size if size <= 512 * 1024 * 1024 => size,
+            size if size <= 512 * MEGA => size,
             size => size / 2,
         };
         if !settings.buffer_size_is_explicit {
-            buffer_size = buffer_size.max(8 * 1024 * 1024);
+            buffer_size = buffer_size.max(8 * MEGA);
         }
         let read_result: ReadResult<Tmp> = read_write_loop(
             files,
@@ Expand Down @@

-Original file line number
+Diff line change
@@ Expand Up / @@ -6,6 +6,14 @@ @@
     //! Parser for sizes in SI or IEC units (multiples of 1000 or 1024 bytes).
+    // IEC binary unit constants for byte parsing (powers of 1024)
+    pub const KILO: usize = 1024;
+    pub const MEGA: usize = 1024 * 1024;
+    pub const GIGA: usize = 1024 * 1024 * 1024;
+    pub const TERA: usize = 1024 * 1024 * 1024 * 1024;
+    pub const PETA: usize = 1024 * 1024 * 1024 * 1024 * 1024;
+    pub const EXA: usize = 1024 * 1024 * 1024 * 1024 * 1024 * 1024;
     use std::error::Error;
     use std::fmt;
     use std::num::{IntErrorKind, ParseIntError};
@@ Expand Down @@

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Sort: improve the code after recent changes #10647

Diff view

Diff view

There are no files selected for viewing

xtqqczze Feb 2, 2026

Uh oh!

xtqqczze Feb 2, 2026 •

edited

Loading

Uh oh!

xtqqczze Feb 2, 2026 •

edited

Loading

Uh oh!

Uh oh!

Uh oh!

Sort: improve the code after recent changes #10647

Are you sure you want to change the base?

Sort: improve the code after recent changes #10647

Uh oh!

Uh oh!

Diff view

Diff view

There are no files selected for viewing

xtqqczze Feb 2, 2026

Choose a reason for hiding this comment

Uh oh!

xtqqczze Feb 2, 2026 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

xtqqczze Feb 2, 2026 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Uh oh!

xtqqczze Feb 2, 2026 •

edited

Loading

xtqqczze Feb 2, 2026 •

edited

Loading